[{"data":1,"prerenderedAt":-1},["ShallowReactive",2],{"$fQBLhDIG3J1JIxDE1fOtA1GoUoxD8vHL_AQ-b9BcK7cU":3},{"answer":4,"createTime":5,"id":6,"options":7,"origin":12,"question":19,"related":20,"source":30,"type":31},[],"2025-12-11 20:06:51",240747174,[8,9,10,11],"10万","1亿","100","1000亿",{"count":13,"courseId":14,"courseImg":15,"courseName":16,"workId":17,"workName":18},104,"53e1d2ef4961cca8eea3e23969ad2cb9","https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002F03a579384a6dc297c89809b582fcc767.png","默认课程","work_46198252","作业10(3.3)","以下对人脑神经元数量量级估计最正确的是( )",[21,32,41,50,59,68,77,80,89,98],{"answer":22,"createTime":5,"id":23,"options":24,"question":29,"source":30,"type":31},[],240747168,[25,26,27,28],"该动作在状态s下必然导致失败","执行该动作后,长期累积奖励的期望为负","环境对该动作的即时奖励一定为负","该状态s下没有任何有价值的动作","如果某一&quot;状态-动作对&quot;(s,a)的Q值为负,说明( )","v1",0,{"answer":33,"createTime":5,"id":34,"options":35,"question":40,"source":30,"type":31},[],240747169,[36,37,38,39],"K-means聚类","线性回归","决策树","最近邻方法","对于下图中的x和y之间关系的建模,最适合的方法是( ). \u003Cimg src=\"https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002F7d71404c5a367fdb356eed1634901647.png\">",{"answer":42,"createTime":5,"id":43,"options":44,"question":49,"source":30,"type":31},[],240747170,[45,46,47,48],"平均值","为0的值","较大的值","较小的值","在实际应用中,找到损失函数的最小值非常困难,找到一个令人满意的( )就可以了",{"answer":51,"createTime":5,"id":52,"options":53,"question":58,"source":30,"type":31},[],240747171,[54,55,56,57],"学生在课堂上听老师讲解数学公式并做习题","机器人在迷宫中不断探索,找到出口后获得奖励","利用标注好的图片训练图像识别模型","程序员手动编写代码实现特定功能","下列( )学习方式最能体现强化学习的试错特性",{"answer":60,"createTime":5,"id":61,"options":62,"question":67,"source":30,"type":31},[],240747172,[63,64,65,66],"树突","激励函数","加权处理","输出矩阵","以下最不可能是人工神经元组成部分的是( )",{"answer":69,"createTime":5,"id":70,"options":71,"question":76,"source":30,"type":31},[],240747173,[72,73,74,75],"Conv","Adam","SGD","AdamW","需要手动调节学习率的优化器是( )",{"answer":78,"createTime":5,"id":6,"options":79,"question":19,"source":30,"type":31},[],[8,9,10,11],{"answer":81,"createTime":5,"id":82,"options":83,"question":88,"source":30,"type":31},[],240747175,[84,85,86,87],"模型在测试集上表现一定越好","模型在所有数据上预测结果越接近真实结果","模型在训练集上预测结果越接近标签","模型性能所有数据上一定越差","模型训练集上的平均损失函数越小说明( )",{"answer":90,"createTime":5,"id":91,"options":92,"question":97,"source":30,"type":31},[],240747176,[93,94,95,96],"定义环境的初始状态","决定智能体在给定状态下选择哪个动作","计算环境给予的奖励值","记录智能体的所有历史动作","&quot;策略(Policy)&quot;在强化学习中扮演的角色是( )",{"answer":99,"createTime":5,"id":100,"options":101,"question":106,"source":30,"type":31},[],240747177,[102,103,104,105],"0","0.1","0.2","0.3","为了防止出现梯度消失,一般训练前初始化神经参数时,最不宜将参数初始化为( )"]