[{"data":1,"prerenderedAt":-1},["ShallowReactive",2],{"$foJApZzrbefVYqeKmJrFKIHMFP187MEtSwWqmIcr1zp8":3},{"answer":4,"createTime":5,"id":6,"options":7,"origin":12,"question":18,"related":19,"source":29,"type":40},[],"2024-10-25 12:45:34",999757647,[8,9,10,11],"\u003Cimg src=\"https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002F2a68f4ad04fb5fd5de8da534e317c32e.jpg\">","\u003Cimg src=\"https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002F024b795e664adf5f4d4b3199b689853f.jpg\">","\u003Cimg src=\"https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002Fcad0f1810075051feeca28416236d7cb.jpg\">","\u003Cimg src=\"https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002Fb5c5404c1fc961404ea95003dac2cd55.jpg\">",{"courseId":13,"courseImg":14,"courseName":15,"workId":16,"workName":17},"1000000860","https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002Fcf3bb414b5ea2367f316b2d3561124c7.jpg","[共享课]人工智能","59023987","第七章单元测试","在强化学习值函数近似中,时间差分方法对梯度计算是( )",[20,31,41,44,52],{"answer":21,"createTime":5,"id":22,"options":23,"question":28,"source":29,"type":30},[],999757634,[24,25,26,27],"减少内存的消耗","复杂的计算获得更精确的表示","可以采样更多的样本","可以减少采样","使用强化学习状态的泛化表示的好处有( )","v2",1,{"answer":32,"createTime":5,"id":33,"options":34,"question":39,"source":29,"type":40},[],999757641,[35,36,37,38],"\u003Cimg src=\"https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002Fc64c76f174de69d7b1330a638b030ddc.jpg\">","\u003Cimg src=\"https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002F19233f93055b2f45980b959d23a149df.jpg\">","\u003Cimg src=\"https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002Fc51e86d2b2e90bf3dbb005801b358c43.jpg\">","\u003Cimg src=\"https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002Fd4019a2887a154a93aa69a666dd1eeeb.jpg\">","在强化学习值函数近似中,蒙特卡洛方法对梯度计算是( )",0,{"answer":42,"createTime":5,"id":6,"options":43,"question":18,"source":29,"type":40},[],[8,9,10,11],{"answer":45,"createTime":5,"id":46,"options":47,"question":50,"source":29,"type":51},[],999757671,[48,49],"对","错","在强化学习值函数近似中,蒙特卡洛方法中可以使用SARSA和Q-learning进行真值的学习( )",3,{"answer":53,"createTime":5,"id":54,"options":55,"question":56,"source":29,"type":51},[],999757673,[48,49],"强化学习中有有模型的方法和无模型的方法( )"]