[{"data":1,"prerenderedAt":-1},["ShallowReactive",2],{"$ffbOLlQwV1caXaCr975Yz3N5JZ71tMmlC8a_3Z9VCLFs":3},{"answer":4,"createTime":5,"id":6,"options":7,"origin":12,"question":19,"related":20,"source":30,"type":31},[],"2024-06-16 17:17:07",152057250,[8,9,10,11],"CRF","Word2Vec","LSTM","BERT",{"count":13,"courseId":14,"courseImg":15,"courseName":16,"workId":17,"workName":18},64,"c49fd4b586de147b5e3f29516c5bcb62","https:\u002F\u002Ftihai-oss-cloud.itihey.com\u002Fimg\u002F9c1e48361b00f3ee2086f4e259ed792b.jpg","自然语言处理与知识图谱技术","exam_124583319","2023-2024第二学期人工智能22级期末模拟考试","下列哪个是常见的词向量模型",[21,32,41,50,59,62,71,81,90,99],{"answer":22,"createTime":5,"id":23,"options":24,"question":29,"source":30,"type":31},[],152057246,[25,26,27,28],"情感分析","文档归类","垃圾邮件过滤","机器翻译","下列哪项不是自然语言处理中文本分类(Text Classification)的常见应用之一","v1",0,{"answer":33,"createTime":5,"id":34,"options":35,"question":40,"source":30,"type":31},[],152057247,[36,37,38,39],"字序上的理解","语言上的理解","语音上的理解","语义上的理解","要想提取出&quot;有用&quot;的信息,仅提取关键词、统计词频等是远远不够的,必须对用户数据(尤其是发言、评论等)进行()",{"answer":42,"createTime":5,"id":43,"options":44,"question":49,"source":30,"type":31},[],152057248,[45,46,47,48],"关闭隐马尔可夫模型进行分词","进行关键词提取","开启隐马尔可夫模型进行新词发现","启用用户词典进行分词","在使用Jieba的jieba.cut()函数时,参数HMM设置为True的作用是什么",{"answer":51,"createTime":5,"id":52,"options":53,"question":58,"source":30,"type":31},[],152057249,[54,55,56,57],"window","min_count","epochs","size","在使用gensim库进行Word2Vec模型训练时,以下哪个参数用于指定训练数据的迭代次数",{"answer":60,"createTime":5,"id":6,"options":61,"question":19,"source":30,"type":31},[],[8,9,10,11],{"answer":63,"createTime":5,"id":64,"options":65,"question":70,"source":30,"type":31},[],152057251,[66,67,68,69],"re.search(pattern, string)","re.sub(pattern, repl, string)","re.match(pattern, string)","re.findall(pattern, string)","re模块支持正则表达式,用于检测字符串开头位置是否匹配模式pattern的函数是:",{"answer":72,"createTime":73,"id":74,"options":75,"question":80,"source":30,"type":31},[],"2024-06-16 17:17:08",152057252,[76,77,78,79],"N元文法","一元文法","数据平滑","一元切分","在统计语言模型中,通常以概率的形式描述任意语句的可能性,利用最大相似度估计进行度量,对于一些低频词,无论如何扩大训练数据,出现的频度仍然很低,下列哪种方法可以解决这一问题()",{"answer":82,"createTime":73,"id":83,"options":84,"question":89,"source":30,"type":31},[],152057253,[85,86,87,88],"图灵机器人","数据挖掘","百度翻译","微信语音转文字","不属于 NLP 应用场景的是()",{"answer":91,"createTime":73,"id":92,"options":93,"question":98,"source":30,"type":31},[],152057254,[94,95,96,97],"去停用词","语料预处理","词性标注","中文分词","中文 NLP 的基本流程由语料获取、()、文本向量化、模型构建、模型训练和 模型评价 6部分组成",{"answer":100,"createTime":73,"id":101,"options":102,"question":107,"source":30,"type":31},[],152057255,[103,104,105,106],"命名实体识别(Named Entity Recognition)","停用词消除(Stop Word Removal)","词干提取(Stemming)","词形还原(Lemmatization)","从给定的句子、段落中识别人名、组织名的过程称为"]