[{"data":1,"prerenderedAt":-1},["ShallowReactive",2],{"$ffceMrrUdtJy34iLzFx6-4CR_tXDy6RB-OOoiuI1cQnU":3},{"answer":4,"createTime":5,"id":6,"options":7,"origin":10,"question":16,"related":17,"source":27,"type":51},[],"2024-10-25 12:45:34",999757671,[8,9],"对","错",{"courseId":11,"courseImg":12,"courseName":13,"workId":14,"workName":15},"1000000860","https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002Fcf3bb414b5ea2367f316b2d3561124c7.jpg","[共享课]人工智能","59023987","第七章单元测试","在强化学习值函数近似中,蒙特卡洛方法中可以使用SARSA和Q-learning进行真值的学习( )",[18,29,39,48,52],{"answer":19,"createTime":5,"id":20,"options":21,"question":26,"source":27,"type":28},[],999757634,[22,23,24,25],"减少内存的消耗","复杂的计算获得更精确的表示","可以采样更多的样本","可以减少采样","使用强化学习状态的泛化表示的好处有( )","v2",1,{"answer":30,"createTime":5,"id":31,"options":32,"question":37,"source":27,"type":38},[],999757641,[33,34,35,36],"\u003Cimg src=\"https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002Fc64c76f174de69d7b1330a638b030ddc.jpg\">","\u003Cimg src=\"https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002F19233f93055b2f45980b959d23a149df.jpg\">","\u003Cimg src=\"https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002Fc51e86d2b2e90bf3dbb005801b358c43.jpg\">","\u003Cimg src=\"https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002Fd4019a2887a154a93aa69a666dd1eeeb.jpg\">","在强化学习值函数近似中,蒙特卡洛方法对梯度计算是( )",0,{"answer":40,"createTime":5,"id":41,"options":42,"question":47,"source":27,"type":38},[],999757647,[43,44,45,46],"\u003Cimg src=\"https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002F2a68f4ad04fb5fd5de8da534e317c32e.jpg\">","\u003Cimg src=\"https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002F024b795e664adf5f4d4b3199b689853f.jpg\">","\u003Cimg src=\"https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002Fcad0f1810075051feeca28416236d7cb.jpg\">","\u003Cimg src=\"https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002Fb5c5404c1fc961404ea95003dac2cd55.jpg\">","在强化学习值函数近似中,时间差分方法对梯度计算是( )",{"answer":49,"createTime":5,"id":6,"options":50,"question":16,"source":27,"type":51},[],[8,9],3,{"answer":53,"createTime":5,"id":54,"options":55,"question":56,"source":27,"type":51},[],999757673,[8,9],"强化学习中有有模型的方法和无模型的方法( )"]