{"id":"https://openalex.org/W4315705847","doi":"https://doi.org/10.48550/arxiv.2301.03726","title":"Neighborhood-Regularized Self-Training for Learning with Few Labels","display_name":"Neighborhood-Regularized Self-Training for Learning with Few Labels","publication_year":2023,"publication_date":"2023-01-10","ids":{"openalex":"https://openalex.org/W4315705847","doi":"https://doi.org/10.48550/arxiv.2301.03726"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2301.03726","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2301.03726","pdf_url":"https://arxiv.org/pdf/2301.03726","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2301.03726","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100687200","display_name":"Ran Xu","orcid":"https://orcid.org/0000-0003-1387-6696"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Ran","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100397967","display_name":"Yue Yu","orcid":"https://orcid.org/0000-0002-3683-5208"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Yue","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033157677","display_name":"Hejie Cui","orcid":"https://orcid.org/0000-0001-6388-2619"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cui, Hejie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070286873","display_name":"Xuan Kan","orcid":"https://orcid.org/0000-0003-0076-8346"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kan, Xuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015101640","display_name":"Yanqiao Zhu","orcid":"https://orcid.org/0000-0003-2205-5304"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhu, Yanqiao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022272635","display_name":"Joyce C. Ho","orcid":"https://orcid.org/0000-0001-9168-3916"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ho, Joyce","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100460272","display_name":"Chao Zhang","orcid":"https://orcid.org/0000-0003-3009-598X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Chao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5006897094","display_name":"Carl Yang","orcid":"https://orcid.org/0000-0001-9145-4531"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Carl","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.980400025844574,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.980400025844574,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9552000164985657,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7691486477851868},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.6433767676353455},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6378348469734192},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.6230067014694214},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5894521474838257},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5644534826278687},{"id":"https://openalex.org/keywords/sample","display_name":"Sample (material)","score":0.5601657032966614},{"id":"https://openalex.org/keywords/upload","display_name":"Upload","score":0.5073680281639099},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.47488683462142944},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.4426214396953583},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.44242992997169495},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.43332844972610474},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.4333120584487915},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4142463803291321},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.08488580584526062},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.07169532775878906},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.0633344054222107}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7691486477851868},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.6433767676353455},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6378348469734192},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.6230067014694214},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5894521474838257},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5644534826278687},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.5601657032966614},{"id":"https://openalex.org/C71901391","wikidata":"https://www.wikidata.org/wiki/Q7126699","display_name":"Upload","level":2,"score":0.5073680281639099},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.47488683462142944},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.4426214396953583},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.44242992997169495},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.43332844972610474},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.4333120584487915},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4142463803291321},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.08488580584526062},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.07169532775878906},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.0633344054222107},{"id":"https://openalex.org/C111368507","wikidata":"https://www.wikidata.org/wiki/Q43518","display_name":"Oceanography","level":1,"score":0.0},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.0},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2301.03726","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2301.03726","pdf_url":"https://arxiv.org/pdf/2301.03726","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2301.03726","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2301.03726","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2301.03726","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2301.03726","pdf_url":"https://arxiv.org/pdf/2301.03726","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.7200000286102295}],"awards":[{"id":"https://openalex.org/G1726583756","display_name":"III: Small: Go Beyond Short-term Dependency and Homogeneity: A General-Purpose Transformer Recipe for Multi-Domain Heterogeneous Sequential Data Analysis","funder_award_id":"2008334","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G2477648378","display_name":null,"funder_award_id":"IIS-2145411","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G2893488462","display_name":"BigData:IA:Collaborative Research: TIMES: A tensor factorization platform for spatio-temporal data","funder_award_id":"1838200","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G3494058236","display_name":"CAREER: Aequitas: A comprehensive machine learning framework to decode health disparities","funder_award_id":"2145411","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6484623147","display_name":"III: Medium: Collaborative Research: Principled Uncertainty Quantification in Deep Learning Models for Time Series Analysis","funder_award_id":"2106961","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6671297155","display_name":null,"funder_award_id":"CAREER","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8844335058","display_name":null,"funder_award_id":"IIS-1838200","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320309381","display_name":"Emory University","ror":"https://ror.org/03czfpz43"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4315705847.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2361861616","https://openalex.org/W2263699433","https://openalex.org/W2377979023","https://openalex.org/W2218034408","https://openalex.org/W2392921965","https://openalex.org/W2944823289","https://openalex.org/W2383111961","https://openalex.org/W2365952365","https://openalex.org/W2358755282","https://openalex.org/W2352448290"],"abstract_inverted_index":{"Training":[0],"deep":[1],"neural":[2],"networks":[3],"(DNNs)":[4],"with":[5,55,106,145],"limited":[6],"supervision":[7],"has":[8,23],"been":[9,24],"a":[10,65],"popular":[11],"research":[12],"topic":[13],"as":[14],"it":[15,38],"can":[16],"significantly":[17],"alleviate":[18],"the":[19,42,51,72,84,102,130,141,146],"annotation":[20],"burden.":[21],"Self-training":[22],"successfully":[25],"applied":[26],"in":[27],"semi-supervised":[28],"learning":[29],"tasks,":[30],"but":[31],"one":[32],"drawback":[33],"of":[34,74,132,140],"self-training":[35,81,104],"is":[36,39],"that":[37,53,97,123],"vulnerable":[40],"to":[41,59,70,156],"label":[43],"noise":[44,131],"from":[45,86],"incorrect":[46],"pseudo":[47,76,133],"labels.":[48,77],"Inspired":[49],"by":[50,135],"fact":[52],"samples":[54],"similar":[56,61],"labels":[57,134],"tend":[58],"share":[60],"representations,":[62],"we":[63],"develop":[64],"neighborhood-based":[66],"sample":[67,90],"selection":[68,127],"approach":[69],"tackle":[71],"issue":[73],"noisy":[75],"We":[78],"further":[79,120],"stabilize":[80],"via":[82],"aggregating":[83],"predictions":[85],"different":[87],"rounds":[88],"during":[89],"selection.":[91],"Experiments":[92],"on":[93,117],"eight":[94],"tasks":[95],"show":[96],"our":[98,124],"proposed":[99,125],"method":[100],"outperforms":[101],"strongest":[103],"baseline":[105],"1.83%":[107],"and":[108,114,137,151],"2.51%":[109],"performance":[110],"gain":[111],"for":[112],"text":[113],"graph":[115],"datasets":[116],"average.":[118],"Our":[119,149],"analysis":[121],"demonstrates":[122],"data":[126],"strategy":[128],"reduces":[129],"36.8%":[136],"saves":[138],"57.3%":[139],"time":[142],"when":[143],"compared":[144],"best":[147],"baseline.":[148],"code":[150],"appendices":[152],"will":[153],"be":[154],"uploaded":[155],"https://github.com/ritaranx/NeST.":[157]},"counts_by_year":[],"updated_date":"2026-06-22T08:00:12.763002","created_date":"2025-10-10T00:00:00"}
