{"id":4033946,"identifier":"DVN/9ICICY","persistentUrl":"https://doi.org/10.7910/DVN/9ICICY","protocol":"doi","authority":"10.7910","separator":"/","publisher":"Harvard Dataverse","publicationDate":"2020-08-26","storageIdentifier":"file://10.7910/DVN/9ICICY","datasetType":"dataset","datasetVersion":{"id":204287,"datasetId":4033946,"datasetPersistentId":"doi:10.7910/DVN/9ICICY","storageIdentifier":"file://10.7910/DVN/9ICICY","versionNumber":1,"versionMinorNumber":0,"versionState":"RELEASED","latestVersionPublishingState":"RELEASED","deaccessionLink":"","lastUpdateTime":"2020-08-26T09:11:32Z","releaseTime":"2020-08-26T09:11:32Z","createTime":"2020-08-25T08:57:05Z","publicationDate":"2020-08-26","citationDate":"2020-08-26","license":{"name":"CC0 1.0","uri":"http://creativecommons.org/publicdomain/zero/1.0","iconUri":"https://licensebuttons.net/p/zero/1.0/88x31.png","rightsIdentifier":"CC0-1.0","rightsIdentifierScheme":"SPDX","schemeUri":"https://spdx.org/licenses/","languageCode":"en"},"fileAccessRequest":false,"metadataBlocks":{"citation":{"displayName":"Citation Metadata","name":"citation","fields":[{"typeName":"title","multiple":false,"typeClass":"primitive","value":"Replication Data for: Not Just Conspiracy Theories:  Vaccine Opponents and Proponents add to the COVID-19 ‘Infodemic’ on Twitter"},{"typeName":"author","multiple":true,"typeClass":"compound","value":[{"authorName":{"typeName":"authorName","multiple":false,"typeClass":"primitive","value":"Broniatowski, David"},"authorAffiliation":{"typeName":"authorAffiliation","multiple":false,"typeClass":"primitive","value":"The George Washington University"}}]},{"typeName":"datasetContact","multiple":true,"typeClass":"compound","value":[{"datasetContactName":{"typeName":"datasetContactName","multiple":false,"typeClass":"primitive","value":"Broniatowski, David"},"datasetContactAffiliation":{"typeName":"datasetContactAffiliation","multiple":false,"typeClass":"primitive","value":"The George Washington University"},"datasetContactEmail":{"typeName":"datasetContactEmail","multiple":false,"typeClass":"primitive","value":"broniatowski@gwu.edu"}}]},{"typeName":"dsDescription","multiple":true,"typeClass":"compound","value":[{"dsDescriptionValue":{"typeName":"dsDescriptionValue","multiple":false,"typeClass":"primitive","value":"These files contain the data required to replicate all findings in the referenced paper. Files include:\r\n\r\n1) 2000_Account_IDs.txt -- a tab-separated text file listing the top 2000 accounts mentioning vaccine-related keywords in CY 2019.\r\n2) users_ids.csv -- a comma-separated file listing all tweet IDs containing coronavirus-related keywords generated by each of the 2000 accounts. The first entry on each line is a username, followed by a list of tweet IDs.\r\n3) users_botscores.txt -- a tab-separated text file listing the bot scores generated from querying Botometer on March 2, 2020. The first entry is the raw (English) bot score and the second entry is the CAP score. \r\n4) corona_topic_keys.txt -- the top 20 words for each of 35 topics generated using the LDA algorithm fit to all tweets listed in users_ids.csv\r\n5) corona_doc_topics.txt -- LDA model topic results fit to each tweet in users_ids.csv. The second column corresponds to the tweet ID, and the following 35 columns are topic proportions for topics 0-34, respectively."}}]},{"typeName":"subject","multiple":true,"typeClass":"controlledVocabulary","value":["Computer and Information Science","Medicine, Health and Life Sciences","Social Sciences"]},{"typeName":"depositor","multiple":false,"typeClass":"primitive","value":"Broniatowski, David"},{"typeName":"dateOfDeposit","multiple":false,"typeClass":"primitive","value":"2020-08-25"}]}},"files":[{"description":"User ID, retweet count, and annotations for the 2000 most prolific accounts in the vaccine stream Twitter archive for calendar year 2019.","label":"2000_Account_IDs.txt","restricted":false,"version":1,"datasetVersionId":204287,"dataFile":{"id":4033950,"persistentId":"doi:10.7910/DVN/9ICICY/2UJMPA","pidURL":"https://doi.org/10.7910/DVN/9ICICY/2UJMPA","filename":"2000_Account_IDs.txt","contentType":"text/plain","friendlyType":"Plain Text","filesize":82350,"description":"User ID, retweet count, and annotations for the 2000 most prolific accounts in the vaccine stream Twitter archive for calendar year 2019.","storageIdentifier":"s3://dvn-cloud:17425aece6c-eadf8646ecd3","rootDataFileId":-1,"md5":"765d76a9dfc3afc8c33df411eee6d711","checksum":{"type":"MD5","value":"765d76a9dfc3afc8c33df411eee6d711"},"tabularData":false,"creationDate":"2020-08-25","publicationDate":"2020-08-26","fileAccessRequest":false}},{"description":"LDA model topic results fit to each tweet in users_ids.csv. The second column corresponds to the tweet ID, and the following 35 columns are topic proportions for topics 0-34, respectively.","label":"corona_doc_topics.txt","restricted":false,"version":1,"datasetVersionId":204287,"dataFile":{"id":4033949,"persistentId":"doi:10.7910/DVN/9ICICY/ZL605Z","pidURL":"https://doi.org/10.7910/DVN/9ICICY/ZL605Z","filename":"corona_doc_topics.txt","contentType":"text/plain","friendlyType":"Plain Text","filesize":58582774,"description":"LDA model topic results fit to each tweet in users_ids.csv. The second column corresponds to the tweet ID, and the following 35 columns are topic proportions for topics 0-34, respectively.","storageIdentifier":"s3://dvn-cloud:17425af4e5f-98ced1413462","rootDataFileId":-1,"md5":"90aab72a59912b5e15a184da4a1cc42d","checksum":{"type":"MD5","value":"90aab72a59912b5e15a184da4a1cc42d"},"tabularData":false,"creationDate":"2020-08-25","publicationDate":"2020-08-26","fileAccessRequest":false}},{"description":"The top 20 words for each of 35 topics generated using the LDA algorithm fit to all tweets listed in users_ids.csv","label":"corona_topic_keys.txt","restricted":false,"version":1,"datasetVersionId":204287,"dataFile":{"id":4033948,"persistentId":"doi:10.7910/DVN/9ICICY/MTSEWB","pidURL":"https://doi.org/10.7910/DVN/9ICICY/MTSEWB","filename":"corona_topic_keys.txt","contentType":"text/plain","friendlyType":"Plain Text","filesize":5707,"description":"The top 20 words for each of 35 topics generated using the LDA algorithm fit to all tweets listed in users_ids.csv","storageIdentifier":"s3://dvn-cloud:17425af5110-dd7ad3a3a69a","rootDataFileId":-1,"md5":"5d00e8b064678737e9b9b734c223fa6d","checksum":{"type":"MD5","value":"5d00e8b064678737e9b9b734c223fa6d"},"tabularData":false,"creationDate":"2020-08-25","publicationDate":"2020-08-26","fileAccessRequest":false}},{"description":"A tab-separated text file listing the bot scores generated from querying Botometer on March 2, 2020. The first entry is the raw (English) bot score and the second entry is the CAP score. ","label":"users_botscores.txt","restricted":false,"version":1,"datasetVersionId":204287,"dataFile":{"id":4033951,"persistentId":"doi:10.7910/DVN/9ICICY/IU5WBK","pidURL":"https://doi.org/10.7910/DVN/9ICICY/IU5WBK","filename":"users_botscores.txt","contentType":"text/plain","friendlyType":"Plain Text","filesize":94907,"description":"A tab-separated text file listing the bot scores generated from querying Botometer on March 2, 2020. The first entry is the raw (English) bot score and the second entry is the CAP score. ","storageIdentifier":"s3://dvn-cloud:17425af52c5-932955abe0b7","rootDataFileId":-1,"md5":"2c903355daf65f018e93a3aa47afd7b7","checksum":{"type":"MD5","value":"2c903355daf65f018e93a3aa47afd7b7"},"tabularData":false,"creationDate":"2020-08-25","publicationDate":"2020-08-26","fileAccessRequest":false}},{"description":"A comma-separated file listing all tweet IDs containing coronavirus-related keywords generated by each of the 2000 accounts. The first entry on each line is a username, followed by a list of tweet IDs.","label":"users_ids.csv","restricted":false,"version":1,"datasetVersionId":204287,"dataFile":{"id":4033947,"persistentId":"doi:10.7910/DVN/9ICICY/2TPWZH","pidURL":"https://doi.org/10.7910/DVN/9ICICY/2TPWZH","filename":"users_ids.csv","contentType":"text/csv","friendlyType":"Comma Separated Values","filesize":102034100,"description":"A comma-separated file listing all tweet IDs containing coronavirus-related keywords generated by each of the 2000 accounts. The first entry on each line is a username, followed by a list of tweet IDs.","storageIdentifier":"s3://dvn-cloud:17425b00007-055e76f32254","rootDataFileId":-1,"md5":"64945b46965939c2dcc8379cfb0c3817","checksum":{"type":"MD5","value":"64945b46965939c2dcc8379cfb0c3817"},"tabularData":false,"creationDate":"2020-08-25","publicationDate":"2020-08-26","fileAccessRequest":false}}],"citation":"Broniatowski, David, 2020, \"Replication Data for: Not Just Conspiracy Theories: Vaccine Opponents and Proponents add to the COVID-19 ‘Infodemic’ on Twitter\", https://doi.org/10.7910/DVN/9ICICY, Harvard Dataverse, V1"}}