{“状态”:“确定”,“消息类型”:“工作”,“信息版本”:“1.0.0”,“邮件”:{“索引”:{“日期部分”:[[2024,2,13]],“日期时间”:“2024-02-13T11:02:18Z”,“时间戳”:1707822138846},“出版商位置”:“柏林,海德堡”,“参考计数”:11,“出版者”:“施普林格-柏林-海德堡(Springer Berlin Heidelberg)”,“isbn-type”:[{“值”:“9783642235375”,“类型”:“打印”},{“值”:“9783642235382”,“type”:“electronic”}],“license”:[{“start”:{“date-parts”:[[2011,1,1]],“date-time”:“2011-01-01T00:00:00Z”,“timestamp”:1293840000000},“content-version”:“unspecified”,“delay-in-days”:0,“URL”:“http://\www.springer.com\/tdm”},{“开始”:{“date-ports”:[2011,1,1,1],“日期-时间”:“2011-01-01T00:00:00Z”,“时间戳”:1293840000000},“content-version”:“unspecified”,“delay-in-days”:0,“URL”:“http://www.springer.com//tdm”}],“content-domain”:{“domain”:[],“crossmark-restriction”:false},“short-container-title”:[],”published-print“:{”date-parts“:[[2011]]},”DOI“:”10.1007\/978-3642-23538-250“,”type“:”book-capter“,”created“:”{“date-part”:[[2011,8,27]],“日期时间”:“2011-08-27T07:11:37Z”,“时间戳”:1314429097000},“页面”:“395-402”,“来源”:“Crossref”,“is-referenced-by-count”:21,“标题”:[“hrWaC and slWac:Compiling Web Corpora for Croatian and Slovene”],“前缀”:“10.1007”,”作者:[{“given”:“Nikola”,“family”:“Ljube\u0161i\u0107”,“sequence”:“first”,“affiliation”:[]},{“given”:“Toma\u017e”,“family”:“Erjavec”,“sequence”:“additional”,“affiliation”:[]}],“member”:“297”,“reference”:[{“issue”:“3”,“key”:“50_CR1”,“doi-asserted-by”:“publisher”,”first page“:”209“,”doi“:”10.1007\/s10579-009-9081-4“,”volume“:“43”,“author”:“M.Baroni“,”year“:”2009“,”unstructured“:“Baroni,M.,Bernardini,S.,Ferraresi,A.,Zanchetta,E.:WaCky wide web:一个非常大的语言处理网络搜索语料库的集合。语言资源和评估\u00a043(3),209\u2013226(2009)”,“新闻标题”:“语言资源和评价”},{“key”:“50_CR2”,“非结构化”:“Guevara,E.:NoWaC:一个大型的基于网络的挪威语料库。In:NAACL HLT 2010第六届网络语料库研讨会,pp.1\u20137(2010)”},{“key”:“50_CR3”,“unstructured”:“Spoustov,D.,Spousta,M.,Pecina,P.:构建捷克语的网络语料集。In:Seventh Intl.Conf.on Language Resources and Evaluation,LREC 2010:“Sharoff,S.:分析语料库之间的异同。In:7th Conference\u201dLanguage Technologies\u201d,Jo\u017eef Stefan Institute,卢布尔雅那,pp.5\u201311(2010)”},{“key”:“50_CR5”,“doi-asserted-by”:“crossref”,“unstructured”:“Kohlsch\u00fctter,C.,Fankhauser,P.,Nejdl,W.:使用浅文本特征进行Boilerplate检测。摘自:WSDM 2010,pp.441\u2013450(2010)”,“DOI”:“10.1145\/1718487.1718542”},{“key”:“50_CR6”,“unstructured”:“Stupar,M.,Juri\u0107,T.,Ljube\u0161i\u0106,N.:构建语言语料库的网络数据语言识别。In:2011年信息会议论文集(正在出版)”},{“key”:“50_CR7”,“unstructured”:“Agi\u0107,\u017d.,Tadi\u0108,M.:评估克罗地亚语文本的形态句法标记。In:Fifth Intl。Conf.on Language Resources and Evaluation(2006)“},{”issue“:“3”,”key“:“50_CR8”,”first page“:”253”,“volume”:“15”,“author”:“T.Erjavec”,“year”:“2005”,“unstructured”:“Erjavec,T.,Ignat,C.,Pouligen,B.,Steinberger,R.:大规模多语言语料库编译:Acquis Communataire and ToTaLe.控制科学档案\u00a015(3),253\u2013264(2005)“,”journal-title“:”Archives of Control Sciences“},{“key”:“50_CR9”,“unstructured”:“Erjavec,T.,Krek,S.:斯洛文尼亚语的JOS形态句法标记语料库。In:Sixth Intl.Conf.on Language Resources and Evaluation(2008)”},“key“:”50_CR10“,”unstructure“:”Erjavec,T.:MULTEXT-最新版本4:多语言形态句法规范,词汇和语料库。In:Seventh Intl.Conf.on Language Resources and Evaluation(2010)“},{”key“:”50_CR11“,”nonstructured“:”McCallum,A.K.:MALLET:A Machine Learning for Language Toolkit(2002),\n\nhttp:\/\/MALLET.cs.umass.edu“}],”container title“:[”文本、语音和对话“,”计算机科学讲义“],”original-title“:[],”link“:[{”URL“:”http://\/link.springer.com/content\/pdf\/10.1007\/978-3642-23538-250“,”content-type“:”unspecified“,”content-version“:”vor“,”intended-application“:”similarity-checking“}],”deposed“:{”date-parts“:[2019,4,1]],”date-time“:“2019-04-01T12:24:14Z”,“timestamp”:155412145000},“score”:1,“资源”:{“主”:{“URL”:“http://\/link.springer.com/10.1007\/978-3642-23538-250“}},”副标题“:[],”短标题“:[],”已发布“:{”日期-部件“:[[2011]]},“ISBN”:[“9783642235375”,“978364 2235382”],”参考计数“:11,”URL“http://\/dx.doi.org\/10.10007\/978-3642-23538-2_50”,“关系”:{},:[“0302-9743”,“1611-3349”],“ISSN-type”:[{“value”:“0302-7743”value“:“1611-3349”,“type”:“electronic”}],“subject”:[],“published”:{“date-parts”:[[2011]]}}