<?xml version="1.0" encoding="UTF-8"?>
<!-- DDI Codebook 2.5 metadata record for the Harvard Dataverse dataset doi:10.7910/DVN/M5PRZB. -->
<!-- Text-bearing elements are deliberately kept on a single line so that no indentation whitespace leaks into their values. -->
<codeBook xmlns="ddi:codebook:2_5"
          xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
          xsi:schemaLocation="ddi:codebook:2_5 https://ddialliance.org/Specification/DDI-Codebook/2.5/XMLSchema/codebook.xsd"
          version="2.5">
  <!-- Document description: citation, distributor and version of this metadata record. -->
  <docDscr>
    <citation>
      <titlStmt>
        <titl>A two-stage registry-anchored approach for precision improvement in organization name recognition from PubMed affiliation strings: a validation study</titl>
        <IDNo agency="DOI">doi:10.7910/DVN/M5PRZB</IDNo>
      </titlStmt>
      <distStmt>
        <distrbtr source="archive">Harvard Dataverse</distrbtr>
        <distDate>2026-02-04</distDate>
      </distStmt>
      <verStmt source="archive">
        <version date="2026-02-05" type="RELEASED">2</version>
      </verStmt>
      <biblCit>Kang, Inmo; Park, Joonmo; Jeong, Heesoo; Chung, Seyoung; Jeon, Changmin; Moon, Seongwuk, 2026, "A two-stage registry-anchored approach for precision improvement in organization name recognition from PubMed affiliation strings: a validation study", https://doi.org/10.7910/DVN/M5PRZB, Harvard Dataverse, V2</biblCit>
    </citation>
  </docDscr>
  <!-- Study description: authors, contact, subject, abstract and access terms of the dataset itself. -->
  <stdyDscr>
    <citation>
      <titlStmt>
        <titl>A two-stage registry-anchored approach for precision improvement in organization name recognition from PubMed affiliation strings: a validation study</titl>
        <IDNo agency="DOI">doi:10.7910/DVN/M5PRZB</IDNo>
      </titlStmt>
      <!-- Authors, in the same order as in biblCit; all share one affiliation string. -->
      <rspStmt>
        <AuthEnty affiliation="Graduate School of Management of Technology, Sogang University, Seoul, Korea">Kang, Inmo</AuthEnty>
        <AuthEnty affiliation="Graduate School of Management of Technology, Sogang University, Seoul, Korea">Park, Joonmo</AuthEnty>
        <AuthEnty affiliation="Graduate School of Management of Technology, Sogang University, Seoul, Korea">Jeong, Heesoo</AuthEnty>
        <AuthEnty affiliation="Graduate School of Management of Technology, Sogang University, Seoul, Korea">Chung, Seyoung</AuthEnty>
        <AuthEnty affiliation="Graduate School of Management of Technology, Sogang University, Seoul, Korea">Jeon, Changmin</AuthEnty>
        <AuthEnty affiliation="Graduate School of Management of Technology, Sogang University, Seoul, Korea">Moon, Seongwuk</AuthEnty>
      </rspStmt>
      <prodStmt/>
      <distStmt>
        <distrbtr source="archive">Harvard Dataverse</distrbtr>
        <contact affiliation="Sogang University, Seoul, Korea" email="seongwuk@sogang.ac.kr">Moon, Seongwuk</contact>
        <!-- NOTE(review): depositor text is kept exactly as exported; the name ordering looks unusual, confirm against the deposit record. -->
        <depositr>(KCSE), Korean Councils of Science Editors</depositr>
        <depDate>2026-02-04</depDate>
      </distStmt>
      <holdings URI="https://doi.org/10.7910/DVN/M5PRZB"/>
    </citation>
    <stdyInfo>
      <subject>
        <keyword xml:lang="en">Social Sciences</keyword>
      </subject>
      <abstract>Dataset 1. The dataset analyzed during the current study.</abstract>
      <sumDscr/>
    </stdyInfo>
    <method>
      <dataColl>
        <sources/>
      </dataColl>
      <anlyInfo/>
    </method>
    <dataAccs>
      <setAvail/>
      <useStmt/>
      <!-- Terms-of-use note: the content is an escaped HTML anchor linking to the CC0 1.0 dedication. -->
      <notes type="DVN:TOU" level="dv">&lt;a href="http://creativecommons.org/publicdomain/zero/1.0">CC0 1.0&lt;/a></notes>
    </dataAccs>
    <othrStdyMat/>
  </stdyDscr>
  <!-- Data files: each otherMat carries the file label, a Dataverse data-file access URI and a note with the MIME type. -->
  <otherMat ID="f13435379" URI="https://dataverse.harvard.edu/api/access/datafile/13435379" level="datafile">
    <labl>20251220_SciEdit_ROR corpus_Submit.json</labl>
    <notes level="file" type="DATAVERSE:CONTENTTYPE" subject="Content/MIME Type">application/json</notes>
  </otherMat>
  <otherMat ID="f13434960" URI="https://dataverse.harvard.edu/api/access/datafile/13434960" level="datafile">
    <labl>Dataset 1. The dataset analyzed during the current study..csv</labl>
    <notes level="file" type="DATAVERSE:CONTENTTYPE" subject="Content/MIME Type">text/comma-separated-values</notes>
  </otherMat>
  <otherMat ID="f13435378" URI="https://dataverse.harvard.edu/api/access/datafile/13435378" level="datafile">
    <labl>geo_data.json</labl>
    <notes level="file" type="DATAVERSE:CONTENTTYPE" subject="Content/MIME Type">application/json</notes>
  </otherMat>
  <otherMat ID="f13434973" URI="https://dataverse.harvard.edu/api/access/datafile/13434973" level="datafile">
    <labl>Suppl. 1. Methods for constructing the ROR corpus, PubMed sample, and gold standard..pdf</labl>
    <notes level="file" type="DATAVERSE:CONTENTTYPE" subject="Content/MIME Type">application/pdf</notes>
  </otherMat>
  <otherMat ID="f13434972" URI="https://dataverse.harvard.edu/api/access/datafile/13434972" level="datafile">
    <labl>Suppl. 2. Model implementation details..pdf</labl>
    <notes level="file" type="DATAVERSE:CONTENTTYPE" subject="Content/MIME Type">application/pdf</notes>
  </otherMat>
  <otherMat ID="f13434971" URI="https://dataverse.harvard.edu/api/access/datafile/13434971" level="datafile">
    <labl>Suppl. 3. Evaluation metrics and baseline implementation..pdf</labl>
    <notes level="file" type="DATAVERSE:CONTENTTYPE" subject="Content/MIME Type">application/pdf</notes>
  </otherMat>
</codeBook>