[{"data":1,"prerenderedAt":-1},["ShallowReactive",2],{"$fywMUXZ2fAmknW4CUF6-Syo6cpcgRGaSBANI_1iLUnFU":3},{"answer":4,"createTime":5,"id":6,"options":7,"origin":12,"question":15,"related":16,"source":20,"type":21},[],"2024-11-25 09:45:47",999757153,[8,9,10,11],"蒙特卡洛法","梯度下降法","牛顿法","时序差分法",{"courseImg":13,"courseName":14},"https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002Fcf3bb414b5ea2367f316b2d3561124c7.jpg","[共享课]人工智能","强化学习的近似的策略评估中,计算真值的方法有( )",[17],{"answer":18,"createTime":5,"id":6,"options":19,"question":15,"source":20,"type":21},[],[8,9,10,11],"v2",1]