{"@context":{"@language":"en","@vocab":"https://schema.org/","citeAs":"cr:citeAs","column":"cr:column","conformsTo":"dct:conformsTo","cr":"http://mlcommons.org/croissant/","rai":"http://mlcommons.org/croissant/RAI/","data":{"@id":"cr:data","@type":"@json"},"dataType":{"@id":"cr:dataType","@type":"@vocab"},"dct":"http://purl.org/dc/terms/","examples":{"@id":"cr:examples","@type":"@json"},"extract":"cr:extract","field":"cr:field","fileProperty":"cr:fileProperty","fileObject":"cr:fileObject","fileSet":"cr:fileSet","format":"cr:format","includes":"cr:includes","isLiveDataset":"cr:isLiveDataset","jsonPath":"cr:jsonPath","key":"cr:key","md5":"cr:md5","parentField":"cr:parentField","path":"cr:path","recordSet":"cr:recordSet","references":"cr:references","regex":"cr:regex","repeated":"cr:repeated","replace":"cr:replace","sc":"https://schema.org/","separator":"cr:separator","source":"cr:source","subField":"cr:subField","transform":"cr:transform","wd":"https://www.wikidata.org/wiki/"},"@type":"sc:Dataset","conformsTo":"http://mlcommons.org/croissant/1.0","name":"A two-stage registry-anchored approach for precision improvement in organization name recognition from PubMed affiliation strings: a validation study","url":"https://doi.org/10.7910/DVN/M5PRZB","creator":[{"@type":"Person","givenName":"Inmo","familyName":"Kang","affiliation":{"@type":"Organization","name":"Graduate School of Management of Technology, Sogang Univeristy, Seoul, Korea"},"sameAs":"https://orcid.org/0009-0009-9244-6360","@id":"https://orcid.org/0009-0009-9244-6360","identifier":"https://orcid.org/0009-0009-9244-6360","name":"Kang, Inmo"},{"@type":"Person","givenName":"Joonmo","familyName":"Park","sameAs":"https://orcid.org/0009-0007-5917-5701","@id":"https://orcid.org/0009-0007-5917-5701","identifier":"https://orcid.org/0009-0007-5917-5701","name":"Park, Joonmo"},{"@type":"Person","givenName":"Heesoo","familyName":"Jeong","sameAs":"https://orcid.org/0009-0005-9592-8788","@id":"https://orcid.org/0009-0005-9592-8788","identifier":"https://orcid.org/0009-0005-9592-8788","name":"Jeong, Heesoo"},{"@type":"Person","givenName":"Seyoung","familyName":"Chung","sameAs":"https://orcid.org/0009-0006-0037-1065","@id":"https://orcid.org/0009-0006-0037-1065","identifier":"https://orcid.org/0009-0006-0037-1065","name":"Chung, Seyoung"},{"@type":"Person","givenName":"Changmin","familyName":"Jeon","sameAs":"https://orcid.org/0009-0000-0711-1158","@id":"https://orcid.org/0009-0000-0711-1158","identifier":"https://orcid.org/0009-0000-0711-1158","name":"Jeon, Changmin"},{"@type":"Person","givenName":"Seongwuk","familyName":"Moon","sameAs":"https://orcid.org/0000-0003-0375-533X","@id":"https://orcid.org/0000-0003-0375-533X","identifier":"https://orcid.org/0000-0003-0375-533X","name":"Moon, Seongwuk"}],"description":"Dataset 1. The dataset analyzed during the current study.","keywords":["Social Sciences"],"license":"http://creativecommons.org/publicdomain/zero/1.0","datePublished":"2026-02-04","dateModified":"2026-02-04","includedInDataCatalog":{"@type":"DataCatalog","name":"Harvard Dataverse","url":"https://dataverse.harvard.edu"},"publisher":{"@type":"Organization","name":"Harvard Dataverse"},"version":"2.0","citeAs":"@data{DVN/M5PRZB_2026,author = {Kang, Inmo and Park, Joonmo and Jeong, Heesoo and Chung, Seyoung and Jeon, Changmin and Moon, Seongwuk},publisher = {Harvard Dataverse},title = {A two-stage registry-anchored approach for precision improvement in organization name recognition from PubMed affiliation strings: a validation study},year = {2026},url = {https://doi.org/10.7910/DVN/M5PRZB}}","distribution":[{"@type":"cr:FileObject","@id":"20251220_SciEdit_ROR corpus_Submit.json","name":"20251220_SciEdit_ROR corpus_Submit.json","encodingFormat":"application/json","md5":"1c2d5d72a7f57d200105acbbf6f45f16","contentSize":"27951904","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/13435379"},{"@type":"cr:FileObject","@id":"Dataset 1. The dataset analyzed during the current study..csv","name":"Dataset 1. The dataset analyzed during the current study..csv","encodingFormat":"text/comma-separated-values","md5":"9eb6a588057ed3c3a7d25e3fdfc876fe","contentSize":"16368830","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/13434960"},{"@type":"cr:FileObject","@id":"geo_data.json","name":"geo_data.json","encodingFormat":"application/json","md5":"9b090e6a99b096bce98fdc3b2fb37cef","contentSize":"10177","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/13435378"},{"@type":"cr:FileObject","@id":"Suppl. 1. Methods for constructing the ROR corpus, PubMed sample, and gold standard..pdf","name":"Suppl. 1. Methods for constructing the ROR corpus, PubMed sample, and gold standard..pdf","encodingFormat":"application/pdf","md5":"4e2604a1ab8497320e4b0ec083a57dd9","contentSize":"145280","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/13434973"},{"@type":"cr:FileObject","@id":"Suppl. 2. Model implementation details..pdf","name":"Suppl. 2. Model implementation details..pdf","encodingFormat":"application/pdf","md5":"4cfddb6438f9dca0447289be589b4b46","contentSize":"165417","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/13434972"},{"@type":"cr:FileObject","@id":"Suppl. 3. Evaluation metrics and baseline implementation..pdf","name":"Suppl. 3. Evaluation metrics and baseline implementation..pdf","encodingFormat":"application/pdf","md5":"db2e048a41708585454e11f7e96d4e3f","contentSize":"144969","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/13434971"}]}