{“id”:“https://openalex.org/W2797980629“,”doi“:”https://doi.org/10.109/icsc.2018.00045“,”title“:”科学知识库建设的数据采集和信息提取“,”display_name“:”科技知识库建设中的数据采集与信息提取“;”publication_year“:2018,”publication_date“:”2018-01-01“,”ids“:{”openalex“:”https://openalex.org/W2797980629“,”doi“:”https://doi.org/10.109/icsc.2018.00045“,”mag“:”2797980629“},”language“:”en“,”primary_location“:{”is_oa“:false,”landing_page_url“:”https://doi.org/10.109/icsc.2018.00045“,”pdf_url“:null,”source“:null,”license“:null',”licence_id“:null,”version“:nuller,”is_accepted“:false,”is_published“:false},”type“:”article“,”type_crossref“:“procesdings-article”,”indexed_in“:[”crossref“],”open_access“:{”is_oa“:false,”oa_status“:”closed“,”oa_url”:null“,”any_repository_has_fulltext“:false}”,”authorships“:[{”author_position“:”first“,”作者“:{”id“:”https://openalex.org/A5057496609“,”display_name“:”Piotr Andruszkiewicz“,”orcid“:null},”institutions“:[{”id“:”https://openalex.org/I108403487“,”display_name“:”华沙理工大学“,”ror“:”https://ror.org/00y0xnp53“,”country_code“:”PL“,”type“:“教育”,”世系“:[”https://openalex.org/I108403487“]},{”id“:”https://openalex.org/I4210087266“,”display_name“:”计算机科学研究所“,”ror“:”https://ror.org/003fvp964“,”国家代码“:”PL“,”类型“:”设施“,”沿袭“:[”https://openalex.org/I4210087266","https://openalex.org/I99542240“]}],”国家“:[”PL“],”is_corresponding“:false,”raw_author_name“:”Piotr Andruszkiewicz“,”raw _ afiliation_strings“:[“波兰华沙华沙理工大学计算机科学研究所”],”affiliations“:[{”raw _affiliation_strong“:”波兰华沙科技大学计算机科学学院”,“institution_ids”:[“https://openalex.org/I108403487","https://openalex.org/I4210087266“]}]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5027943585“,”display_name“:”Henryk Rybi\u0144ski“,”orcid“:”https://orcid.org/0000-0002-2890-7080},“机构”:[{“id”:https://openalex.org/I108403487“,”display_name“:”华沙理工大学“,”ror“:”https://ror.org/00y0xnp53“,”country_code“:”PL“,”type“:“教育”,”世系“:[”https://openalex.org/I108403487“]},{”id“:”https://openalex.org/I4210087266“,”display_name“:”计算机科学研究所“,”ror“:”https://ror.org/003fvp964“,”国家代码“:”PL“,”类型“:”设施“,”沿袭“:[”https://openalex.org/I4210087266","https://openalex.org/I99542240“]}],”国家“:[”PL“],”is_corresponding“:false,”raw_author_name“:”Henryk Rybinski“,”raw _ afiliation_strings“:[“波兰华沙理工大学计算机科学研究所”],”affiliations“:[{”raw _affiliation_strong“:”波兰华沙科技大学计算机科学学院”,“institution_ids”:[“https://openalex.org/I108403487","https://openalex.org/I4210087266“]}]}],”countries_distinct_count“:1,”institutions_disting_count”:2,”corresponding_author_ids“:[],”corresponding_institution_ids”:[]、“apc_list”:null,”apc_payd“:null、”has_fulltext“:true、”fulltext_origin“:”ngrams“,”cited_by_count:3,“cited_by_percentile_year”:{“min”:78,”max“:80},”biblio“:{”volume“:nul”,“issue”:null,“first_page”:null,“last_page”:null},“is_retracted”:false,“is_paratext”:false,“primary_topic”:{“id”:“https://openalex.org/T2016“,”display_name“:”Web数据提取和爬网技术“,”score“:0.9999,”subfield“:{”id“:”https://openalex.org/subfields/1710“,”display_name“:”Information Systems“},”field“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”Physical Sciences“}},”topics“:[{”id“:”https://openalex.org/T2016“,”“display_name”:“Web数据提取和爬网技术”,“score”:0.9999,“subfield”:{“id”:“https://openalex.org/subfields/1710“,”display_name“:”Information Systems“},”field“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T11719“,”display_name“:”数据质量评估和改进“,”score“:0.9906,”subfield“:{”id“:”https://openalex.org/subfields/1803“,”display_name“:”管理科学与运筹学“},”字段“:{”id“:”https://openalex.org/fields/18“,”display_name“:”Decision Sciences“},”domain“:{”id“:”https://openalex.org/domains/2“,”“display_name”:“社会科学”}},{”id“:”https://openalex.org/T13976“,”“display_name”:“学术研究中的网络计量分析”,“score”:0.9837,“subfield”:{“id”:“https://openalex.org/subfields/1710“,”display_name“:”Information Systems“},”field“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/web-data-extraction网站“,”display_name“:”Web数据提取“,”score“:0.649487},{”id“:”https://openalex.org/keywords/information检索“,”display_name“:”信息检索“,”score“:0.549529},{”id“:”https://openalex.org/keywords/data-cleaning(https://openalex.org/keywords/data-cleaning)“,”display_name“:”数据清理“,”score“:0.543832},{”id“:”https://openalex.org/keywords/data-integration网站“,”display_name“:”数据集成“,”score“:0.535989},{”id“:”https://openalex.org/keywords/internet-research网站“,”display_name“:”Internet Research“,”score“:0.512955}],”concepts“:[{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.6767142},{”id“:”https://openalex.org/C4554734网址,“wikidata”:https://www.wikidata.org/wiki/Q593744“,”display_name“:”知识库“,”level“:2,”score“:0.6384193},{”id“:”https://openalex.org/C195807954,“wikidata”:https://www.wikidata.org/wiki/Q1662562“,”display_name“:”信息提取“,”level“:2,”score“:0.57977664},{”id“:”https://openalex.org/C42058472,“wikidata”:https://www.wikidata.org/wiki/Q810214“,”display_name“:”Base(topology)“,”level“:2,”score“:0.5115477},{”id“:”https://openalex.org/C2777220311,“wikidata”:https://www.wikidata.org/wiki/Q6423340“,”display_name“:”知识获取“,”level“:2,”score“:0.4912824},{”id“:”https://openalex.org/C23123220,“wikidata”:https://www.wikidata.org/wiki/Q816826“,”display_name“:”信息检索“,”level“:1,”score“:0.45963034},{”id“:”https://openalex.org/C4725764,“wikidata”:https://www.wikidata.org/wiki/Q844704“,”display_name“:”提取(化学)“,”级别“:2,”分数“:0.45215416},{”id“:”https://openalex.org/C120567893,“wikidata”:https://www.wikidata.org/wiki/Q1582085“,”display_name“:”知识提取“,”level“:2,”score“:0.42733},{”id“:”https://openalex.org/C2522767166,“wikidata”:https://www.wikidata.org/wiki/Q2374463“,”display_name“:”数据科学“,”level“:1,”score“:0.41535085},{”id“:”https://openalex.org/C56739046,“wikidata”:https://www.wikidata.org/wiki/Q192060“,”display_name“:”知识管理“,”level“:1,”score“:0.34212407},{”id“:”https://openalex.org/C124101348,“wikidata”:https://www.wikidata.org/wiki/Q172491“,”display_name“:”数据挖掘“,”level“:1,”score“:0.27710795},{”id“:”https://openalex.org/C136764020,“wikidata”:https://www.wikidata.org/wiki/Q466“,”display_name“:”万维网“,”级别“:1,”分数“:0.27178252},{”id“:”https://openalex.org/C33923547,“wikidata”:https://www.wikidata.org/wiki/Q395“,”display_name“:”数学“,”等级“:0,”分数“:0.09965718},{”id“:”https://openalex.org/C185592680,“wikidata”:https://www.wikidata.org/wiki/Q2329“,”display_name“:”Chemistry“,”level“:0,”score“:0.06687957},{”id“:”https://openalex.org/C134306372,“wikidata”:https://www.wikidata.org/wiki/Q7754“,”display_name“:”数学分析“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C43617362,“wikidata”:https://www.wikidata.org/wiki/Q170050“,”display_name“:”Chromatography“,”level“:1,”score“:0.0}],”mesh“:[],”locations_count“:1,”locations“:[{”is_oa“:false,”landing_page_url“:”https://doi.org/10.109/icsc.2018.00045“,”pdf_url“:null,”source“:null,”license“:null:”license_id“:null,”version“:nuller,”is_accepted“:false,”is_published“:false}],”best_oa_location“:nul,”sustainable_development_goals“:[],”grants“:[],”datasets“:],”versions“:[]:”,“referenced_works_count”:8,“referrenced_works”:[”https://openalex.org/W121874958","https://openalex.org/W1489992655","https://openalex.org/W1968053850","https://openalex.org/W2022322548","https://openalex.org/W2104086170","https://openalex.org/W2142276227","https://openalex.org/W2289610612","https://openalex.org/W2911456401“],”related_works“:[”https://openalex.org/W2599749361","https://openalex.org/W2385713529","https://openalex.org/W2382915105","https://openalex.org/W2380657991","https://openalex.org/W2140138473","https://openalex.org/W2019276034","https://openalex.org/W1988622546","https://openalex.org/W1850639582","https://openalex.org/W1582777578","https://openalex.org/W1520100787“],”ngrams_url“:”https://api.openalex.org/works/W2797980629/ngrams网站“,”abstract_inverted_index“:{”Here“:[0],”we“:[1,33],”present“:[2],”the“:[3,62,84,92103],”process“:[4,85],”of“:[5,29,81,86100102150],”data“:[6,30,44,59,94109],”acquisition“:[7110],”and“:[8,15,23,36,40,96111],”information“:[9,52,87111212],”extraction“:[100123],”for“:[11108],”building“:”[12],“a”:[113120140],“综合”:[14],“准确”:[16],“科学”:[17141],“知识”:[18146],“基础”:[19],“包括”:[20],“会议”:[21],“出版物”:[22],“科学家”。“:[24],”我们“:[25,50114],”使用“:[26],”两个“:[27,78],”种类“:[28],”来源。“:[31],”首先“:[32],”聚集“:[34],”结构化“:[35],”可靠“:[37],”但是“:[38],”不理解“:[39],”不是“:[41],”总是“:[42],”最新“:[43],”源“:[45,56,80],”这样“:[46],”如“:[47125127],”数字“:[48],”图书馆。“:[49],”enrich“:[51],”extracted“:[53],”from“:[54,61],”these“:[55],”with“:57],”unstructured“:[58,93],”getabled“:60],”Internet“:[63],”by“:[64118128],”filtering“:[65],”websites“:[66],”using“:67129],”SVM“:[68],”classifier“:[69],”to“:[70131],”identifidential“:[71],”potentially“:[72],“有用”:[73],“网络”:[74],“页面。“:[75],”There“:[76],”are“:[77136],”potential“:[79],”errors“:[82],”in“:[88319],”富集。“:[88],”The“:[89],”first“:[90],”is“:[91,98],”origin“:[95],”another“:/97],”lack“:[99],”accuracy“:[101],”machine“:[104],”learning“:[105],”methods“:[106135],”used“:[107138],”extraction“。“:[113],”地址“:[115],”两者“:[116],”问题“:[117],”提议“:[119],”新“:[121],”方法“:[124],”好“:[126],”众包“:[130],”正确“:[132],”信息。“:[133],”我们的“:[134],”当前“:[137],”平台;“:[142],”即,“:[143],”Omega-Psir“:[144],”大学“:[145],”基地“:[147],”包含“:[148],”列表“:[149],”研究人员“:[151],”出版物“:[152],”事件“:[153],”等“:[154]},”引用_by_api_url“:”https://api.openalex.org/works?filter=cites:W2797980629“,”counts_by_year“:[{”年份“:2021,”cited_by_count“:2},{”年“:2019,”cited_by_count”:1}],”更新日期“:”2024-06-17T07:44:01.268860“,”创建日期“:“2018-04-24”}