{"id":"https://openalex.org/W4315706601","doi":"https://doi.org/10.48550/arxiv.2301.04000","title":"Privacy-Preserving Record Linkage for Cardinality Counting","display_name":"Privacy-Preserving Record Linkage for Cardinality Counting","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4315706601","doi":"https://doi.org/10.48550/arxiv.2301.04000"},"language":"en","primary_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2301.04000","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false},"type":"preprint","type_crossref":"posted-content","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/abs/2301.04000","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5041278405","display_name":"Nan Wu","orcid":"https://orcid.org/0000-0002-9429-2889"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Nan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079324810","display_name":"Dinusha Vatsalan","orcid":"https://orcid.org/0000-0001-6713-7667"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vatsalan, Dinusha","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040251515","display_name":"Mohamed Ali K\u00e2afar","orcid":"https://orcid.org/0000-0003-2714-0276"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kaafar, Mohamed Ali","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5066805147","display_name":"Sanath Kumar Ramesh","orcid":"https://orcid.org/0000-0002-9793-7742"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ramesh, Sanath Kumar","raw_affiliation_strings":[],"affiliations":[]}],"institution_assertions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":0,"max":67},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9989,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9989,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":0.9778,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cardinality","display_name":"Cardinality (data modeling)","score":0.7494321},{"id":"https://openalex.org/keywords/record-linkage","display_name":"Record Linkage","score":0.57451737}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.75074077},{"id":"https://openalex.org/C87117476","wikidata":"https://www.wikidata.org/wiki/Q362383","display_name":"Cardinality (data modeling)","level":2,"score":0.7494321},{"id":"https://openalex.org/C142210648","wikidata":"https://www.wikidata.org/wiki/Q1266546","display_name":"Record linkage","level":3,"score":0.57451737},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.4784108},{"id":"https://openalex.org/C64869954","wikidata":"https://www.wikidata.org/wiki/Q1859747","display_name":"False positive paradox","level":2,"score":0.46547386},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.45963934},{"id":"https://openalex.org/C123201435","wikidata":"https://www.wikidata.org/wiki/Q456632","display_name":"Information privacy","level":2,"score":0.45018047},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.43863606},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.363456},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2532555},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.17046738},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.13821805},{"id":"https://openalex.org/C2908647359","wikidata":"https://www.wikidata.org/wiki/Q2625603","display_name":"Population","level":2,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C149923435","wikidata":"https://www.wikidata.org/wiki/Q37732","display_name":"Demography","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2301.04000","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":true,"landing_page_url":"http://arxiv.org/abs/2301.04000","pdf_url":"http://arxiv.org/pdf/2301.04000","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false},{"is_oa":false,"landing_page_url":"https://api.datacite.org/dois/10.48550/arxiv.2301.04000","pdf_url":null,"source":{"id":"https://openalex.org/S4393179698","display_name":"DataCite API","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210145204","host_organization_name":"DataCite","host_organization_lineage":["https://openalex.org/I4210145204"],"host_organization_lineage_names":["DataCite"],"type":"metadata"},"license":null,"license_id":null,"version":null}],"best_oa_location":{"is_oa":true,"landing_page_url":"https://arxiv.org/abs/2301.04000","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":["Cornell University"],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false},"sustainable_development_goals":[],"grants":[],"datasets":[],"versions":[],"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4301272096","https://openalex.org/W4280518517","https://openalex.org/W3111878056","https://openalex.org/W2950751300","https://openalex.org/W2183246718","https://openalex.org/W2148038983","https://openalex.org/W2058438338","https://openalex.org/W2019471580","https://openalex.org/W2002177687","https://openalex.org/W1557094818"],"abstract_inverted_index":{"Several":[0],"applications":[1,21,24,50,63],"require":[2],"counting":[3,18,30,37,53,81,119,149],"the":[4,10,16,38,54,67,80,125,177,197,203,216,230,269],"number":[5,39,68,199,232],"of":[6,40,42,69,72,98,179,200,220,233,251,256],"distinct":[7],"items":[8],"in":[9,100,124,181,235,249],"data,":[11],"which":[12],"is":[13,82],"known":[14],"as":[15,26,52,65,202,209],"cardinality":[17,114,118,137,148,178,204],"problem.":[19],"Example":[20],"include":[22],"health":[23],"such":[25,51,64],"rare":[27],"disease":[28,45],"patients":[29],"for":[31,46,57,79,103,112,136],"adequate":[32],"awareness":[33],"and":[34,36,61,86,88,107,128,157,175,218,243,273],"funding,":[35],"cases":[41],"a":[43,58,129,163,225,261],"new":[44,59],"outbreak":[47],"detection,":[48],"marketing":[49],"visibility":[55],"reached":[56],"product,":[60],"cybersecurity":[62],"tracking":[66],"unique":[70],"views":[71],"social":[73],"media":[74],"posts.":[75],"The":[76,96],"data":[77,99],"needed":[78],"however":[83],"often":[84],"personal":[85],"sensitive,":[87],"need":[89],"to":[90,173,195,228,268],"be":[91],"processed":[92],"using":[93,150,169],"privacy-preserving":[94,117,131,147,165],"techniques.":[95],"quality":[97],"different":[101],"databases,":[102],"example":[104],"typos,":[105],"errors":[106],"variations,":[108],"poses":[109],"additional":[110],"challenges":[111],"accurate":[113,208],"estimation.":[115],"While":[116],"has":[120,141],"gained":[121],"much":[122],"attention":[123],"recent":[126],"times":[127],"few":[130],"algorithms":[132],"have":[133],"been":[134,144],"developed":[135],"estimation,":[138],"no":[139],"work":[140],"so":[142],"far":[143,206],"done":[145],"on":[146,241],"record":[151,166],"linkage":[152,167],"techniques":[153,172],"with":[154,260],"fuzzy":[155,271],"matching":[156,272],"provable":[158],"privacy":[159,187,262],"guarantees.":[160],"We":[161,223],"propose":[162,224],"novel":[164,226],"algorithm":[168],"unsupervised":[170,236],"clustering":[171,274],"link":[174],"count":[176],"individuals":[180],"multiple":[182],"datasets":[183,245],"without":[184],"compromising":[185],"their":[186],"or":[188],"identity.":[189],"In":[190],"addition,":[191],"existing":[192],"Elbow":[193],"methods":[194],"find":[196,229],"optimal":[198,231],"clusters":[201,234],"are":[205,246],"from":[207],"they":[210],"do":[211],"not":[212],"take":[213],"into":[214],"account":[215],"purity":[217],"completeness":[219],"generated":[221],"clusters.":[222],"method":[227],"learning.":[237],"Our":[238],"experimental":[239],"results":[240],"real":[242],"synthetic":[244],"highly":[247],"promising":[248],"terms":[250],"significantly":[252],"smaller":[253],"error":[254],"rate":[255],"less":[257],"than":[258],"0.1":[259],"budget":[263],"{\\epsilon}":[264],"=":[265],"1.0":[266],"compared":[267],"state-of-the-art":[270],"method.":[275]},"cited_by_api_url":"https://api.openalex.org/works?filter=cites:W4315706601","counts_by_year":[],"updated_date":"2025-01-08T21:41:26.181679","created_date":"2023-01-12"}
  NODES