[{"data":1,"prerenderedAt":-1},["ShallowReactive",2],{"$f3w2oT1M0rFw2flRzgU8wisATXJdfoToIzWRtKwBiBaw":3},{"answer":4,"createTime":5,"id":6,"options":7,"origin":12,"question":19,"related":20,"source":28,"type":33},[],"2025-10-22 08:35:32",223326789,[8,9,10,11],"状态和行为维度高","状态信息误差大","现有模型限制","样本量过大,计算复杂",{"count":13,"courseId":14,"courseImg":15,"courseName":16,"workId":17,"workName":18},4,"53e1d2ef4961cca8eea3e23969ad2cb9","https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002F03a579384a6dc297c89809b582fcc767.png","默认课程","cc3532fc23fe4a1da211d554e4deaec2","5.4","强化学习的难点有( )",[21,30,34,43],{"answer":22,"createTime":5,"id":23,"options":24,"question":27,"source":28,"type":29},[],223326788,[8,9,25,26],"样本量过多","模型限制","下列不属于强化学习难点的是( )","v1",0,{"answer":31,"createTime":5,"id":6,"options":32,"question":19,"source":28,"type":33},[],[8,9,10,11],1,{"answer":35,"createTime":5,"id":36,"options":37,"question":42,"source":28,"type":33},[],223326790,[38,39,40,41],"深度学习的训练样本是有标签的,而强化学习没有","深度学习的学习过程是静态的,而强化学习是动态的","深度学习解决的更多是感知问题,强化学习解决的主要是决策问题","深度学习部分有有监督学习和无监督学习之分,强化学习无此分类","深度学习与强化学习的区别有哪些( )",{"answer":44,"createTime":5,"id":45,"options":46,"question":51,"source":28,"type":33},[],223326791,[47,48,49,50],"基于价值的强化学习(Value-based RL)","基于策略的强化学习(Policy-based RL)","深度强化学习(DRL)","逆强化学习(Inverse RL)","强化学习的方法主要有( )"]