[{"data":1,"prerenderedAt":-1},["ShallowReactive",2],{"$f_GOVoBLy5l9iBlJnCVWN7dxvdjOSuCoBiPQWmgQcVaA":3},{"answer":4,"createTime":5,"id":6,"options":7,"origin":12,"question":19,"related":20,"source":30,"type":39},[],"2025-10-22 08:35:32",223326790,[8,9,10,11],"深度学习的训练样本是有标签的,而强化学习没有","深度学习的学习过程是静态的,而强化学习是动态的","深度学习解决的更多是感知问题,强化学习解决的主要是决策问题","深度学习部分有有监督学习和无监督学习之分,强化学习无此分类",{"count":13,"courseId":14,"courseImg":15,"courseName":16,"workId":17,"workName":18},4,"53e1d2ef4961cca8eea3e23969ad2cb9","https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002F03a579384a6dc297c89809b582fcc767.png","默认课程","cc3532fc23fe4a1da211d554e4deaec2","5.4","深度学习与强化学习的区别有哪些( )",[21,32,40,43],{"answer":22,"createTime":5,"id":23,"options":24,"question":29,"source":30,"type":31},[],223326788,[25,26,27,28],"状态和行为维度高","状态信息误差大","样本量过多","模型限制","下列不属于强化学习难点的是( )","v1",0,{"answer":33,"createTime":5,"id":34,"options":35,"question":38,"source":30,"type":39},[],223326789,[25,26,36,37],"现有模型限制","样本量过大,计算复杂","强化学习的难点有( )",1,{"answer":41,"createTime":5,"id":6,"options":42,"question":19,"source":30,"type":39},[],[8,9,10,11],{"answer":44,"createTime":5,"id":45,"options":46,"question":51,"source":30,"type":39},[],223326791,[47,48,49,50],"基于价值的强化学习(Value-based RL)","基于策略的强化学习(Policy-based RL)","深度强化学习(DRL)","逆强化学习(Inverse RL)","强化学习的方法主要有( )"]