{“id”:“https://openalex.org/W2068365491“,”doi“:”https://doi.org/10.1145/1456223.1456277“,”title“:”数据预处理“,”display_name“:”数据预处理“,”publication_year“:2008,”publication_date“:”2008-01-01“,”ids“:{”openalex“:”https://openalex.org/W2068365491“,”doi“:”https://doi.org/10.1145/1456223.1456277“,”mag“:”2068365491“},”language“:”en“,”primary_location“:{”is_oa“:false,”landing_page_url“:”https://doi.org/10.1145/1456223.1456277“,”pdf_url“:null,”source“:null,”license“:null',”licence_id“:null,”version“:nuller,”is_accepted“:false,”is_published“:false},”type“:”article“,”type_crossref“:“procesdings-article”,”indexed_in“:[”crossref“],”open_access“:{”is_oa“:false,”oa_status“:”closed“,”oa_url”:null“,”any_repository_has_fulltext“:false}”,”authorships“:[{”author_position“:”first“,”作者“:{”id“:”https://openalex.org/A5004343218“,”display_name“:”Marcela Xavier Ribeiro“,”orcid“:”https://orcid.org/0000-0002-2323-5326},“机构”:[{“id”:https://openalex.org/I17974374“,”display_name“:”圣保罗大学“,”ror“:”https://ror.org/036rp1748“,”country_code“:”BR“,”type“:“教育”,”世系“:[”https://openalex.org/I17974374“]}],”国家“:[”BR“],”is_corresponding“:false,”raw_author_name“:”Marcela X.Ribeiro“,”raw _ affiliation_strings“:[“圣保罗大学,圣卡洛斯,SP,巴西”],”affiliation“:[{”raw _affiliation_string“:”圣保罗大学https://openalex.org/I17974374“]}]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5090938898“,”display_name“:”M\u00f4nica Ribeiro Porto Ferreira“,”orcid“:null},”institutions“:[{”id“:”https://openalex.org/I17974374“,”display_name“:”圣保罗大学“,”ror“:”https://ror.org/036rp1748“,”country_code“:”BR“,”type“:“教育”,”世系“:[”https://openalex.org/I17974374“]}],”国家“:[”BR“],”is_corresponding“:false,”raw_author_name“:”M\u00f4nica R.P.Ferreira“,”raw _ affiliation_strings“:[“巴西圣卡洛斯圣保罗大学”],”affiliation“:[{”raw _affiliation_string“:”巴西圣卡洛斯圣保罗大学https://openalex.org/I17974374“]}]},{”author_position“:”middle“,”author“:{”id“:”https://openalex.org/A5020611078“,”display_name“:”Caetano Traina“,”orcid“:”https://orcid.org/0000-0002-6625-6047},“机构”:[{“id”:https://openalex.org/I17974374“,”display_name“:”圣保罗大学“,”ror“:”https://ror.org/036rp1748“,”country_code“:”BR“,”type“:“教育”,”世系“:[”https://openalex.org/I17974374“]}],”国家“:[”BR“],”is_corresponding“:false,”raw_author_name“:”Caetano Traina“,”raw _ afiliation_strings“:[“圣保罗大学,圣卡洛斯,SP,巴西”],”affiliations“:[{”raw_ afiliation _string“:”圣保罗大学https://openalex.org/I17974374“]}]},{”author_position“:”last“,”author“:{”id“:”https://openalex.org/A5014783020“,”display_name“:”Agma J.M.Traina“,”orcid“:”https://orcid.org/0000-0003-4929-7258},“机构”:[{“id”:https://openalex.org/I17974374“,”display_name“:”圣保罗大学“,”ror“:”https://ror.org/036rp1748“,”country_code“:”BR“,”type“:“教育”,”世系“:[”https://openalex.org/I17974374“]}],”国家“:[”BR“],”is_corresponding“:false,”raw_author_name“:”Agma J.M.Traina“,”raw _ affiliation_strings“:[“圣保罗大学,圣卡洛斯,SP,巴西”],”affiliation“:[{”raw _affiliation_string“:”圣保罗大学https://openalex.org/I17974374“]}]}],”countries_distinct_count“:1,”institutions_disting_count”:1,“corresponding_author_ids”:[],”correspounding_institution_ids“:[]”,“apc_list”:null,”apc_payed“:null”,“fwci”:0.832,“has_fulltext”:true,“fulltext_origin”:“ngrams”,“cited_by_count”:9,“citeconding_by_percentile_year”:{“min”:84,“max”:85},“biblio”“:{”volume“:null,”issue“:nul,”first_page“:null,”last_page“:null},”is_retracted“:false,”is_paratext“:fase,”primary_topic“:{”id“:”https://openalex.org/T10538“,”“display_name”:“数据挖掘技术与应用”,“score”:0.9987,“subfield”:{“id”:“https://openalex.org/subfields/1710“,”display_name“:”Information Systems“},”field“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},”主题“:[{”id“:”https://openalex.org/T10538“,”“display_name”:“数据挖掘技术与应用”,“score”:0.9987,“subfield”:{“id”:“https://openalex.org/subfields/1710“,”display_name“:”Information Systems“},”field“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T10320“,”display_name“:”神经网络基础与应用“,”score“:0.993,”subfield“:{”id“:”https://openalex.org/subfields/1702“,”display_name“:”人工智能“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}},{”id“:”https://openalex.org/T11063“,”“display_name”:“粗糙集理论与应用”,“score”:0.9914,“subfield”:{“id”:“https://openalex.org/subfields/1703“,”display_name“:”计算理论与数学“},”字段“:{”id“:”https://openalex.org/fields/17“,”display_name“:”Computer Science“},”domain“:{”id“:”https://openalex.org/domains/3“,”display_name“:”物理科学“}}],”关键词“:[{”id“:”https://openalex.org/keywords/data-mining“,”display_name“:”数据挖掘“,”score“:0.540372},{”id“:”https://openalex.org/keywords/temoral-data-mining“,”display_name“:”时态数据挖掘“,”score“:0.522189},{”id“:”https://openalex.org/keywords/feature-selection网站“,”display_name“:”功能选择“,”score“:0.510163},{”id“:”https://openalex.org/keywords/dep-learning网站“,”display_name“:”深度学习“,”score“:0.509865},{”id“:”https://openalex.org/keywords/decision-analysis网站“,”display_name“:”决策分析“,”score“:0.502992}],”concepts“:[{”id“:”https://openalex.org/C73000952,“wikidata”:https://www.wikidata.org/wiki/Q17007827“,”display_name“:”Discretization“,”level“:2,”score“:0.87303936},{”id“:”https://openalex.org/C148483581,“wikidata”:https://www.wikidata.org/wiki/Q446488“,”display_name“:”功能选择“,”级别“:2,”分数“:0.80968404},{”id“:”https://openalex.org/C41008148,“wikidata”:https://www.wikidata.org/wiki/Q21198“,”display_name“:”计算机科学“,”level“:0,”score“:0.66533196},{”id“:”https://openalex.org/C124101348,“wikidata”:https://www.wikidata.org/wiki/Q172491网址“,”display_name“:”数据挖掘“,”level“:1,”score“:0.6078021},{”id“:”https://openalex.org/C105427703,“wikidata”:https://www.wikidata.org/wiki/Q665193“,”display_name“:”连续特征的离散化“,”level“:4,”score“:0.57966995},{”id“:”https://openalex.org/C84525736,“wikidata”:https://www.wikidata.org/wiki/Q831366“,”display_name“:”决策树“,”level“:2,”score“:0.55628777},{”id“:”https://openalex.org/C10551718,“wikidata”:https://www.wikidata.org/wiki/Q5227332“,”display_name“:”数据预处理“,”level“:2,”score“:0.5458865},{”id“:”https://openalex.org/C138827492,“wikidata”:https://www.wikidata.org/wiki/Q6661985“,”display_name“:”数据处理“,”level“:2,”score“:0.51628345},{”id“:”https://openalex.org/C2776401178,“wikidata”:https://www.wikidata.org/wiki/Q12050496“,”display_name“:”功能(语言学)“,”级别“:2,”分数“:0.46297237},{”id“:”https://openalex.org/C154945302,“wikidata”:https://www.wikidata.org/wiki/Q11660“,”display_name“:”人工智能“,”level“:1,”score“:0.4533311},{”id“:”https://openalex.org/C2779557605,“wikidata”:https://www.wikidata.org/wiki/Q9890“,”display_name“:”Omega“,”level“:2,”score“:0.4495805},{”id“:”https://openalex.org/C26517878,“wikidata”:https://www.wikidata.org/wiki/Q228039“,”display_name“:”Key(lock)“,”level“:2,”score“:0.43056163},{”id“:”https://openalex.org/C95623464,“wikidata”:https://www.wikidata.org/wiki/Q1096149“,”display_name“:”分类器(UML)“,”level“:2,”score“:0.42474866},{”id“:”https://openalex.org/C153180895,“wikidata”:https://www.wikidata.org/wiki/Q7148389“,”display_name“:”模式识别(心理学)“,”level“:2,”score“:0.39850247},{”id“:”https://openalex.org/C119857082,“wikidata”:https://www.wikidata.org/wiki/Q2539“,”display_name“:”机器学习“,”level“:1,”score“:0.37032837},{”id“:”https://openalex.org/C126148662,“wikidata”:https://www.wikidata.org/wiki/Q3890355“,”display_name“:”离散化错误“,”level“:3,”score“:0.3406137},{”id“:”https://openalex.org/C33923547,“wikidata”:https://www.wikidata.org/wiki/Q395“,”display_name“:”数学“,”等级“:0,”分数“:0.19568098},{”id“:”https://openalex.org/C77088390,“wikidata”:https://www.wikidata.org/wiki/Q8513“,”display_name“:”Database“,”level“:1,”score“:0.07428804},{”id“:”https://openalex.org/C134306372,“wikidata”:https://www.wikidata.org/wiki/Q7754“,”display_name“:”数学分析“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C41895202,“wikidata”:https://www.wikidata.org/wiki/Q8162“,”display_name“:”语言学“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C138885662,“wikidata”:https://www.wikidata.org/wiki/Q5891“,”display_name“:”哲学“,”等级“:0,”分数“:0.0},{”id“:”https://openalex.org/C121332964,“wikidata”:https://www.wikidata.org/wiki/Q413“,”display_name“:”物理“,”级别“:0,”分数“:0.0},{”id“:”https://openalex.org/C38652104,“wikidata”:https://www.wikidata.org/wiki/Q3510521“,”display_name“:”计算机安全“,”level“:1,”score“:0.0},{”id“:”https://openalex.org/C62520636,“wikidata”:https://www.wikidata.org/wiki/Q944“,”display_name“:”量子力学“,”level“:1,”score“:0.0}],”mesh“:[],”locations_count“:1.”locations“:[{”is_oa“:false,”landing_page_url“:”https://doi.org/10.1145/1456223.1456277“,”pdf_url“:null,”source“:null,”license“:null,”license_id“:null,”version“:null,”is_accepted“:false,”is_published“:false}],”best_oa_location“:null,”sustainable_development_goals“:[],”grants“:[],”dataset“:[],”version“:[],”referenced_works_count“:21,”referenced_works“:[”https://openalex.org/W1513366687","https://openalex.org/W15233989055","https://openalex.org/W1543818407","https://openalex.org/W1569097076","https://openalex.org/W1583700199","https://openalex.org/W1585743408","https://openalex.org/W1678889691","https://openalex.org/W2097569937","https://openalex.org/W2097839764","https://openalex.org/W2112122409","https://openalex.org/W2119594161","https://openalex.org/W2122175496","https://openalex.org/W2132166479","https://openalex.org/W2135511047","https://openalex.org/W2141355396","https://openalex.org/W2148949939","https://openalex.org/W2149851883","https://openalex.org/W2161919332","https://openalex.org/W2738642287","https://openalex.org/W3120740533","https://openalex.org/W90901292“],”related_works“:[”https://openalex.org/W3200179079","https://openalex.org/W3016666932","https://openalex.org/W2938355325","https://openalex.org/W2888936415","https://openalex.org/W2774597805","https://openalex.org/W2348794337网址","https://openalex.org/W2335687691","https://openalex.org/W2109293916","https://openalex.org/W2068365491","https://openalex.org/W1968641190“],”ngrams_url“:”https://api.openalex.org/works/W2068365491/ngrams“,”“abstract_inverted_index”:{“Data”:[0,32],“pre-processing”:[1,16116190],“is”:[2176],“a”:[3,68],“key”:[4],“element”:[5],“to”:[6,24,46162178],“improve”:[7],“the”:[8,15,18,26,47,54,58112115119122131133140146150155165],“accurability”:[9],“of”:[10,5714121145149152164168],“Data”:[11,19]59,72,80,96134181191193],“挖掘“:[12,27,60194],”算法。“:[13],”In“:[14,62130],”step“:[17],”are“:[20,37],”treated“:[21],”In“:[22118],”order“:[23],“make”:[25],“process”:[28],“reasible”:[29],“and”:[30,34,50,74,82100102107154183],“effectived”。“:[31],”离散化“:[33,73,81,97135182],”特征“:[35,75,83103156184],”选择“:[36104157],”两个“:[38],”重要“:[39],”任务“:[40],”that“:[41174],”can“:[42,51],”be“:[43],”performed“:[44],”previor“:[45],”learning“:[48],”phase“:[49],”significally“:[52],”reduce“:[53],”处理“:[55],”努力“:[56],”算法。“:[61],”this“:[63],”paper“:[64],”we“:[65],”present“:[66],”Omega“:[67],”new“:/69],”algorithm“:[00124],”for“:[71,95189192],”selection。“:[76,84],”Omega“:[77,871318160175],”执行“:[78],”同时“:[79],”我们“:[85],”验证“:[86],”通过“:[88137159],”比较“:[89],”it“:[90],”与“:[91143],”其他“:[92],”众所周知“:[93126],”算法“:[94],”(1R,”:[98],”ChiMerge“:[99],”Chi2)“:[101],”(DTM,”:[105],“救济”:[106],“Chi2)。“:[108],”The“:[109],”testings“:[110],”compared“:[111],”effects“:+113],”technologies“:[117],”results“:/120172],”C4.5“:[123],”(a“:[125],”decision“:[127141],”tree-based“:%128],”classifier“)。“:[129],”结果“:[132],”提供“:[136],”生成“:[139],”树“:[142],”一“:[144163],”最小“:[147166],”平均“:[148167],”数量“:[151],”节点“:[153],”给定“:[158],”引线“:[161],”错误“:[169],”速率。“:[170],”这些“:[171],”表示“:[173],”非常适合“:[177],”执行“:[179],”两者,“:[180],”选择“:[185],”存在“:[186],”高度“:[187],”适当“:[188],”任务。“:[195]},”cited_by_api_url“:”https://api.openalex.org/works?filter=引用:W2068365491“,”counts_by_year“:[{“年份”:2023,”cited_by_count“:1},{“年”:2021,”ciped_by_cunt“:1},”{“年度”:2020,“cited_by_count”:1}.,{”year“:2019,”cited_by_count?:1}:2015,”citted_by_count“:1}],”updated_date“:”2024-07-16T01:31:25.448374“,”created_date:“2016-06-24”}