{“id”:“https://openalex.org/W2910372031“,”doi“:”https://doi.org/10.109/siu.2018.8404678“,”title“:”关系数据库中的近重复检测“,”display_name“:”关联数据库中的接近重复检测“、”publication_year“:2018、”publiation_date“:”2018-05-01“,”ids“:{”openalex“:”https://openalex.org/W2910372031“,”doi“:”https://doi.org/10.109/siu.2018.8404678“,”mag“:”2910372031“},”language“:”en“,”primary_location“:{”is_oa“:false,”landing_page_url“:”https://doi.org/10.109/siu.2018.8404678“,”pdf_url“:null,”source“:null,”license“:null',”licence_id“:null,”version“:nuller,”is_accepted“:false,”is_published“:false},”type“:”article“,”type_crossref“:“procesdings-article”,”indexed_in“:[”crossref“],”open_access“:{”is_oa“:false,”oa_status“:”closed“,”oa_url”:null“,”any_repository_has_fulltext“:false}”,”authorships“:[{”author_position“:”first“,”作者“:{”id“:”https://openalex.org/A5012244756“,”display_name“:”Ahmet Tu\u011frul Bayrak“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“,”Ahmet-Tugrul Bayrake“,”raw _affiliation_strings“:【”ETSTUR,\u0130stanbul,T\u00fcrkiye“】},{“author_position”:“middle”,“author”:{“id”https://openalex.org/A5033509879“,”display_name“:”Aykut Inan Yilmaz“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Aykut Inan Yelmaz“,”raw _affiliation_string“:[”ETSTUR,\u0130stanbul,T\u00fcrkiye“]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5078823708“,”display_name“:”Kemal Burak Yilmaz“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Kemal-Burak Yelmaz“,”raw _affiliation_string“:[”ETSTUR,\u0130stanbul,T\u00fcrkiye“]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5089441412“,”display_name“:”Remzi D\u00fcza\u011fa\u00e7“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Remzi Duzagac“,”raw _affiliation_string“:[”ETSTUR,\u0130stanbul,T\u00fcrkiye“]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5034053831“,”display_name“:”Veri Bilimi“,”orcid“:null},”institutions“:[],”countries“:[],”is_corresponding“:false,”raw_author_name“:”Veri Bilimi“,”raw _affiliation_string“:[”ETSTUR,\u0130stanbul,T\u00fcrkiye“]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5077241173“,”display_name“:”Analitik Bolumu“,”orcid“:null},”institutions“:[],”countries“:[],”is_correresponsing“:false,”raw_author_name“:”Analitik Bolumu“,”raw_affiation_strings“:[”ETSTUR,\u0130stanbul,T\u00fcurkiye“]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5040262351“,”display_name“:”Olcay Taner Y\u0131ld\u0131 z“,”orcid“:null},”institutions“:[{”id“:”https://openalex.org/I167234411“,”display_name“:”I\u015f\u0131k University“,”ror“:”网址:https://ror.org/02j8k6t75“,”country_code“:”TR“,”type“:“教育”,”世系“:[”https://openalex.org/I167234411“]}],”国家“:[”TR“],”is_corresponding“:false,”raw_author_name“:”Olcay Taner Yildiz“,”raw _affiliation_strings“:[“I\u015fik\u00dcniversitesi Bilgisayar M\u00fchendisli\u011fi B\u00f6l\u00fcm\u00fc“]}”,“countries_distiction_count”:1,“institutions_distition_count“:1,”corresponding_author_ids“:[],“corresponding_institution_id”:[],“apc_list”:空,“apc_payd“:null,”has_fulltext“:false,”cited_by_count“:5,”cited_by_percentile_year“:{”min“:82,”max“:83},”biblio“:{“volume”:null“,”issue“:nul,”first_page“:null,”last_page“:null},“is_retracted”:false“is_paratext”:false,“primary_topic”:{“id”:“https://openalex.org/T11719“,”display_name“:”数据质量评估和改进“,”score“:1.0,”subfield“:{”id“:”https://openalex.org/subfields/1803“,”display_name“:”管理科学与运筹学“},”字段“:{”id“:”https://openalex.org/fields/18“,”display_name“:”Decision Sciences“},”domain“:{”id“:”https://openalex.org/domains/2“,”display_name“:”社会科学“}},”主题“:[{”id“:”https://openalex.org/T11719“,”display_name“:”数据质量评估和改进“,”score“:1.0,”subfield“:{”id“:”https://openalex.org/subfields/1803“,”display_name“:”管理科学与运筹学“},”字段“:{”id“:”https://openalex.org/fields/18“,”display_name“:”Decision Sciences“},”domain“:{”id“:”https://openalex.org/domains/2“,”“display_name”:“社会科学”}},{”id“:”https://openalex.org/T2016“,”“display_name”:“Web数据提取和爬网技术”,“score”:0.9892,“subfield”:{“id”:“https://openalex.org/subfields/1710“,”display_name“:”Information Systems“},”field“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10764“,”“display_name”:“数据分析和机器学习的隐私保护技术”,“score”:0.9885,“subfield”:{“id”:“https://openalex.org/subfields/s702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/duplicate检测“,”display_name“:”重复检测“,”score“:0.613281},{”id“:”https://openalex.org/keywords/data-records-mining网站“,”display_name“:”数据记录挖掘“,”score“:0.563278},{”id“:”https://openalex.org/keywords/data-cleaning网站“,”display_name“:”数据清理“,”score“:0.516823},{”id“:”https://openalex.org/keywords/machine-learning网站“,”display_name“:”机器学习“,”score“:0.506414}],”concepts“:[{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.6989292},{”id“:”https://openalex.org/C135598885,“wikidata”:https://www.wikidata.org/wiki/Q1366302“,”display_name“:”Row“,”level“:2,”score“:0.65953386},{”id“:”https://openalex.org/C5655090,“wikidata”:https://www.wikidata.org/wiki/Q192588“,”display_name“:”关系数据库“,”level“:2,”score“:0.6543227},{”id“:”https://openalex.org/C103278499,“wikidata”:https://www.wikidata.org/wiki/Q254465“,”display_name“:”相似性(几何)“,”level“:3,”score“:0.55508053},{”id“:”https://openalex.org/C23123220,“wikidata”:https://www.wikidata.org/wiki/Q816826“,”display_name“:”信息检索“,”level“:1,”score“:0.5520815},{”id“:”https://openalex.org/C77088390,“wikidata”:https://www.wikidata.org/wiki/Q8513“,”display_name“:”数据库“,”级别“:1,”分数“:0.4860783},{”id“:”https://openalex.org/C124101348,“wikidata”:https://www.wikidata.org/wiki/Q172491“,”display_name“:”数据挖掘“,”level“:1,”score“:0.4235924},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.19894406},{”id“:”https://openalex.org/C115961682,“wikidata”:https://www.wikidata.org/wiki/Q860623“,”display_name“:”Image(mathematics)“,”level“:2,”score“:0.0}],”mesh“:[],”locations_count“:1,”location“:[{”is_oa“:false,”landing_page_url“:”https://doi.org/10.109/siu.2018.8404678“,”pdf_url“:null,”source“:null,”license“:null:”license_id“:null,”version“:nuller,”is_accepted“:false,”is_published“:false}],”best_oa_location“:nul,”sustainable_development_goals“:[],”grants“:[],”datasets“:],”versions“:[]:”,“referenced_works_count”:6,“referrenced_works”:[”https://openalex.org/W1961147827","https://openalex.org/W2024770506","https://openalex.org/W2036216970","https://openalex.org/W2052390074","https://openalex.org/W2164456230","https://openalex.org/W2296107147“],”related_works“:[”https://openalex.org/W4375869232","https://openalex.org/W4309137527","https://openalex.org/W4281971614","https://openalex.org/W3175260668","https://openalex.org/W3122721839","https://openalex.org/W3021032895","https://openalex.org/W2982353255","https://openalex.org/W2953259538","https://openalex.org/W2390933768","https://openalex.org/W108640429“],”ngrams_url“:”https://api.openalex.org/works/W2910372031/ngrams网站“,”“abstract_inverted_index”:{“While”:[0],“data”:[1,68,72],“amount”:[2],“increases”:[3],“number”:[4],“of”:[5,27,47],“duplicate”:[6,14,34,55,62],“records”:[7,15,35,56],“in”:[8,57],“relational”:[9],“数据库”:[10],“ingress”:[11],“graduplicate.”:[12],“The”:[13,60],“may”:[16],“原因”:[17],“不一致”:[18],“on”:[19],“报告”:[20],“和”:[21,70],“分析。“:[22],“To”:[23],“reduce”:[24],“the”:[25,48,67,71],“effects”:[26],“this”:/28],“problem”,“:[29],“we”:[30],“aim”:[31],“To”:[32,52],“detect”:[33,53],“using”:[36],“machine”:[37],“learning”:[3],“algorithms”:[39],“with”:%40],“features”:%41],“that”:[42],“are”:[43,64],“produced”:[44],“by”:[45],“similarity”:[46],“records”。“:[49,59],“我们”:[50],“实现”:[51],“28412”:[54],“9301467”:[58],“检测到”:[61],“行”:[63],“删除”:[65],“来自”:[66],“源”:[69],“成为”:[73],“更多”:[74],“一致”。“:[75]},”cited_by_api_url“:”https://api.openalex.org/works?filter=cites:W2910372031“,”counts_by_year“:[{”年份“:2022,”cited_by_count“:1},{”年“:2020,”cited_by_count”:1},{“年份”:2019,”citecd_by_count“:3}],”updated_date“:”2024-06-01T10:01:32.825163“,”created_dates“:”2019-01-25“}