[{"data":1,"prerenderedAt":-1},["ShallowReactive",2],{"$fSIEKMeMpkaNocxY1xbVS5kppqflOM3dDcytQSlQFObg":3},{"answer":4,"createTime":5,"id":6,"options":7,"origin":12,"question":19,"related":20,"source":31,"type":32},[],"2025-11-24 13:40:32",240747191,[8,9,10,11],"交叉熵=熵*KL散度","交叉熵=-熵+KL散度","交叉熵=熵+KL散度","交叉熵=熵\u002FKL散度",{"count":13,"courseId":14,"courseImg":15,"courseName":16,"workId":17,"workName":18},104,"53e1d2ef4961cca8eea3e23969ad2cb9","https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002F03a579384a6dc297c89809b582fcc767.png","默认课程","work_46198252","作业10(3.3)","对于交叉熵和KL散度关系,以下最有可能正确的是( )",[21,33,42,51,60,69,78,87,96,105],{"answer":22,"createTime":23,"id":24,"options":25,"question":30,"source":31,"type":32},[],"2025-12-11 20:06:51",240747168,[26,27,28,29],"该动作在状态s下必然导致失败","执行该动作后,长期累积奖励的期望为负","环境对该动作的即时奖励一定为负","该状态s下没有任何有价值的动作","如果某一&quot;状态-动作对&quot;(s,a)的Q值为负,说明( )","v1",0,{"answer":34,"createTime":23,"id":35,"options":36,"question":41,"source":31,"type":32},[],240747169,[37,38,39,40],"K-means聚类","线性回归","决策树","最近邻方法","对于下图中的x和y之间关系的建模,最适合的方法是( ). \u003Cimg src=\"https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002F7d71404c5a367fdb356eed1634901647.png\">",{"answer":43,"createTime":23,"id":44,"options":45,"question":50,"source":31,"type":32},[],240747170,[46,47,48,49],"平均值","为0的值","较大的值","较小的值","在实际应用中,找到损失函数的最小值非常困难,找到一个令人满意的( )就可以了",{"answer":52,"createTime":23,"id":53,"options":54,"question":59,"source":31,"type":32},[],240747171,[55,56,57,58],"学生在课堂上听老师讲解数学公式并做习题","机器人在迷宫中不断探索,找到出口后获得奖励","利用标注好的图片训练图像识别模型","程序员手动编写代码实现特定功能","下列( )学习方式最能体现强化学习的试错特性",{"answer":61,"createTime":23,"id":62,"options":63,"question":68,"source":31,"type":32},[],240747172,[64,65,66,67],"树突","激励函数","加权处理","输出矩阵","以下最不可能是人工神经元组成部分的是( )",{"answer":70,"createTime":23,"id":71,"options":72,"question":77,"source":31,"type":32},[],240747173,[73,74,75,76],"Conv","Adam","SGD","AdamW","需要手动调节学习率的优化器是( )",{"answer":79,"createTime":23,"id":80,"options":81,"question":86,"source":31,"type":32},[],240747174,[82,83,84,85],"10万","1亿","100","1000亿","以下对人脑神经元数量量级估计最正确的是( )",{"answer":88,"createTime":23,"id":89,"options":90,"question":95,"source":31,"type":32},[],240747175,[91,92,93,94],"模型在测试集上表现一定越好","模型在所有数据上预测结果越接近真实结果","模型在训练集上预测结果越接近标签","模型性能所有数据上一定越差","模型训练集上的平均损失函数越小说明( )",{"answer":97,"createTime":23,"id":98,"options":99,"question":104,"source":31,"type":32},[],240747176,[100,101,102,103],"定义环境的初始状态","决定智能体在给定状态下选择哪个动作","计算环境给予的奖励值","记录智能体的所有历史动作","&quot;策略(Policy)&quot;在强化学习中扮演的角色是( )",{"answer":106,"createTime":23,"id":107,"options":108,"question":113,"source":31,"type":32},[],240747177,[109,110,111,112],"0","0.1","0.2","0.3","为了防止出现梯度消失,一般训练前初始化神经参数时,最不宜将参数初始化为( )"]