[{"data":1,"prerenderedAt":-1},["ShallowReactive",2],{"$fekJGxL6v5B6NAPKz1dYSVX_w9B1b-_fJ8GtgITUn3Ng":3},{"answer":4,"createTime":5,"id":6,"options":7,"origin":12,"question":19,"related":20,"source":31,"type":32},[],"2024-06-16 17:17:08",152057252,[8,9,10,11],"N元文法","一元文法","数据平滑","一元切分",{"count":13,"courseId":14,"courseImg":15,"courseName":16,"workId":17,"workName":18},64,"c49fd4b586de147b5e3f29516c5bcb62","https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002F9c1e48361b00f3ee2086f4e259ed792b.jpg","自然语言处理与知识图谱技术","exam_124583319","2023-2024第二学期人工智能22级期末模拟考试","在统计语言模型中,通常以概率的形式描述任意语句的可能性,利用最大相似度估计进行度量,对于一些低频词,无论如何扩大训练数据,出现的频度仍然很低,下列哪种方法可以解决这一问题()",[21,33,42,51,60,69,78,81,90,99],{"answer":22,"createTime":23,"id":24,"options":25,"question":30,"source":31,"type":32},[],"2024-06-16 17:17:07",152057246,[26,27,28,29],"情感分析","文档归类","垃圾邮件过滤","机器翻译","下列哪项不是自然语言处理中文本分类(Text Classification)的常见应用之一","v1",0,{"answer":34,"createTime":23,"id":35,"options":36,"question":41,"source":31,"type":32},[],152057247,[37,38,39,40],"字序上的理解","语言上的理解","语音上的理解","语义上的理解","要想提取出&quot;有用&quot;的信息,仅提取关键词、统计词频等是远远不够的,必须对用户数据(尤其是发言、评论等)进行()",{"answer":43,"createTime":23,"id":44,"options":45,"question":50,"source":31,"type":32},[],152057248,[46,47,48,49],"关闭隐马尔可夫模型进行分词","进行关键词提取","开启隐马尔可夫模型进行新词发现","启用用户词典进行分词","在使用Jieba的jieba.cut()函数时,参数HMM设置为True的作用是什么",{"answer":52,"createTime":23,"id":53,"options":54,"question":59,"source":31,"type":32},[],152057249,[55,56,57,58],"window","min_count","epochs","size","在使用gensim库进行Word2Vec模型训练时,以下哪个参数用于指定训练数据的迭代次数",{"answer":61,"createTime":23,"id":62,"options":63,"question":68,"source":31,"type":32},[],152057250,[64,65,66,67],"CRF","Word2Vec","LSTM","BERT","下列哪个是常见的词向量模型",{"answer":70,"createTime":23,"id":71,"options":72,"question":77,"source":31,"type":32},[],152057251,[73,74,75,76],"re.search(pattern, string)","re.sub(pattern, repl, string)","re.match(pattern, string)","re.findall(pattern, string)","re模块支持正则表达式,用于检测字符串开头位置是否匹配模式pattern的函数是:",{"answer":79,"createTime":5,"id":6,"options":80,"question":19,"source":31,"type":32},[],[8,9,10,11],{"answer":82,"createTime":5,"id":83,"options":84,"question":89,"source":31,"type":32},[],152057253,[85,86,87,88],"图灵机器人","数据挖掘","百度翻译","微信语音转文字","不属于 NLP 应用场景的是()",{"answer":91,"createTime":5,"id":92,"options":93,"question":98,"source":31,"type":32},[],152057254,[94,95,96,97],"去停用词","语料预处理","词性标注","中文分词","中文 NLP 的基本流程由语料获取、()、文本向量化、模型构建、模型训练和 模型评价 6部分组成",{"answer":100,"createTime":5,"id":101,"options":102,"question":107,"source":31,"type":32},[],152057255,[103,104,105,106],"命名实体识别(Named Entity Recognition)","停用词消除(Stop Word Removal)","词干提取(Stemming)","词形还原(Lemmatization)","从给定的句子、段落中识别人名、组织名的过程称为"]