{"@context":{"@language":"en","@vocab":"https://schema.org/","citeAs":"cr:citeAs","column":"cr:column","conformsTo":"dct:conformsTo","cr":"http://mlcommons.org/croissant/","rai":"http://mlcommons.org/croissant/RAI/","data":{"@id":"cr:data","@type":"@json"},"dataType":{"@id":"cr:dataType","@type":"@vocab"},"dct":"http://purl.org/dc/terms/","examples":{"@id":"cr:examples","@type":"@json"},"extract":"cr:extract","field":"cr:field","fileProperty":"cr:fileProperty","fileObject":"cr:fileObject","fileSet":"cr:fileSet","format":"cr:format","includes":"cr:includes","isLiveDataset":"cr:isLiveDataset","jsonPath":"cr:jsonPath","key":"cr:key","md5":"cr:md5","parentField":"cr:parentField","path":"cr:path","recordSet":"cr:recordSet","references":"cr:references","regex":"cr:regex","repeated":"cr:repeated","replace":"cr:replace","sc":"https://schema.org/","separator":"cr:separator","source":"cr:source","subField":"cr:subField","transform":"cr:transform","wd":"https://www.wikidata.org/wiki/"},"@type":"sc:Dataset","conformsTo":"http://mlcommons.org/croissant/1.0","name":"Replication Data for: CASM: A Deep-Learning Approach for Identifying Collective Action Events with Text and Image Data from Social Media","url":"https://doi.org/10.7910/DVN/SS4LNN","creator":[{"@type":"Person","givenName":"Jennifer","familyName":"Pan","affiliation":{"@type":"Organization","name":"Stanford University, Department of Communication"},"sameAs":"https://orcid.org/0000-0002-4818-0122","@id":"https://orcid.org/0000-0002-4818-0122","identifier":"https://orcid.org/0000-0002-4818-0122","name":"Pan, Jennifer"},{"@type":"Person","givenName":"Han","familyName":"Zhang","affiliation":{"@type":"Organization","name":"Princeton University, Department of Sociology"},"sameAs":"https://orcid.org/0000-0003-2912-8780","@id":"https://orcid.org/0000-0003-2912-8780","identifier":"https://orcid.org/0000-0003-2912-8780","name":"Zhang, Han"}],"description":"Protest event analysis is an important method for the study of collective action and social movements and typically draws on traditional media reports as the data source. We introduce collective action from social media (CASM)—a system that uses convolutional neural networks on image data and recurrent neural networks with long short-term memory on text data in a two-stage classifier to identify social media posts about offline collective action. We implement CASM on Chinese social media data and identify more than 100,000 collective action events from 2010 to 2017 (CASM-China). We evaluate the performance of CASM through cross-validation, out-of-sample validation, and comparisons with other protest data sets. We assess the effect of online censorship and find it does not substantially limit our identification of events. Compared to other protest data sets, CASM-China identifies relatively more rural, land-related protests and relatively few collective action events related to ethnic and religious conflict.","keywords":["Social Sciences","collective action, deep learning, event data, social media, China"],"license":"http://creativecommons.org/publicdomain/zero/1.0","datePublished":"2019-06-25","dateModified":"2019-06-25","includedInDataCatalog":{"@type":"DataCatalog","name":"Harvard Dataverse","url":"https://dataverse.harvard.edu"},"publisher":{"@type":"Organization","name":"Harvard Dataverse"},"version":"1.0","citeAs":"@data{DVN/SS4LNN_2019,author = {Pan, Jennifer and Zhang, Han},publisher = {Harvard Dataverse},title = {Replication Data for: CASM: A Deep-Learning Approach for Identifying Collective Action Events with Text and Image Data from Social Media},year = {2019},url = {https://doi.org/10.7910/DVN/SS4LNN}}","citation":[{"@type":"CreativeWork","name":"Zhang Han and Jennifer Pan. 2019. “CASM: A Deep-Learning Approach for Identifying Collective Action Events with Text and Image Data from Social Media” Sociological Methodology 49: 1-59."}],"distribution":[{"@type":"cr:FileObject","@id":"readme.txt","name":"readme.txt","encodingFormat":"text/plain","md5":"e3245b90afb53678ae1174ecfe232fcc","contentSize":"4918","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/U0U6TD"},{"@type":"cr:FileObject","@id":"requirements.txt","name":"requirements.txt","encodingFormat":"text/plain","md5":"4c3eb3b10aa0826da80d75ab07eb5c78","contentSize":"252","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/B1FZ7S"},{"@type":"cr:FileObject","@id":"lib/CASM_c1_deep_text.py","name":"CASM_c1_deep_text.py","encodingFormat":"text/x-python-script","md5":"566328cb7a8049c5982ec576dd37a0fd","contentSize":"4706","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/XIXZFJ"},{"@type":"cr:FileObject","@id":"lib/CASM_c2_deep_text.py","name":"CASM_c2_deep_text.py","encodingFormat":"text/x-python-script","md5":"d415031861898e6e73ed54ab5070280f","contentSize":"2126","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/JDYGYN"},{"@type":"cr:FileObject","@id":"lib/CASM_generate_predicted_probability_image.py","name":"CASM_generate_predicted_probability_image.py","encodingFormat":"text/x-python-script","md5":"d9de62895560149d03e2d375582b09e6","contentSize":"2146","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/WEIQ3Q"},{"@type":"cr:FileObject","@id":"lib/CASM_generate_predicted_probability_text.py","name":"CASM_generate_predicted_probability_text.py","encodingFormat":"text/x-python-script","md5":"db1d9eb0c6427f4ad019d08056f773e6","contentSize":"1904","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/TQBHP1"},{"@type":"cr:FileObject","@id":"lib/common_operations.py","name":"common_operations.py","encodingFormat":"text/x-python-script","md5":"f919552e59da8b3f4442fb5806e14e26","contentSize":"1830","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/JP4Y2E"},{"@type":"cr:FileObject","@id":"lib/dependency.py","name":"dependency.py","encodingFormat":"text/x-python-script","md5":"dbe26dcdc64eb0157228848a7b5be6c3","contentSize":"2738","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/A0TN2J"},{"@type":"cr:FileObject","@id":"lib/LSTM_text_dependency.py","name":"LSTM_text_dependency.py","encodingFormat":"text/x-python-script","md5":"68611cf69dbe364e16bc3ff09b467279","contentSize":"3849","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/M0EPHS"},{"@type":"cr:FileObject","@id":"lib/word_preprocessing.py","name":"word_preprocessing.py","encodingFormat":"text/x-python-script","md5":"8a187d27ea5e4f9f97742b4218cda0cd","contentSize":"5986","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/CCOULI"},{"@type":"cr:FileObject","@id":"modelfiles/image.json","name":"image.json","encodingFormat":"application/json","md5":"885fd25fab7df948a47308702cd00f6b","contentSize":"7662","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/F9ZBR6"},{"@type":"cr:FileObject","@id":"modelfiles/text-stage1.json","name":"text-stage1.json","encodingFormat":"application/json","md5":"89a8f86a1271fdafe843ac1d2cb3e88b","contentSize":"15090","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/3IS0FC"},{"@type":"cr:FileObject","@id":"modelfiles/text-stage2.json","name":"text-stage2.json","encodingFormat":"application/json","md5":"01f6d48037612de554ab63ac5f4921f2","contentSize":"3691","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/88AWK8"},{"@type":"cr:FileObject","@id":"modelfiles/weights_image.h5","name":"weights_image.h5","encodingFormat":"application/x-h5","md5":"0b8f7e6e5f15671354871166d2e69ac6","contentSize":"1019024","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/3JJZNA"},{"@type":"cr:FileObject","@id":"modelfiles/weights_text-stage1.h5","name":"weights_text-stage1.h5","encodingFormat":"application/x-h5","md5":"da69d85dc2a2c30fd5313d21d4d4a3b4","contentSize":"29714656","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/ZWPJMK"},{"@type":"cr:FileObject","@id":"modelfiles/weights_text-stage2.hdf5","name":"weights_text-stage2.hdf5","encodingFormat":"application/x-hdf5","md5":"4b98af52a07544cb8344cae29a97679c","contentSize":"161159592","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/DAAKAC"},{"@type":"cr:FileObject","@id":"output/protest_events.csv","name":"protest_events.csv","encodingFormat":"text/csv","md5":"a3e399dafe0357c18c850e0a394cc807","contentSize":"5408790","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/4N2EUS&format=original"},{"@type":"cr:FileObject","@id":"output/protest_posts.csv","name":"protest_posts.csv","encodingFormat":"text/csv","md5":"54c0b5acb889b71152588e5604125d77","contentSize":"227052755","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/KEQPZU"},{"@type":"cr:FileObject","@id":"plot/Figure10/protest_region_count_prefecture_log_scale.R","name":"protest_region_count_prefecture_log_scale.R","encodingFormat":"type/x-r-syntax","md5":"50a4c336d88c642fafc2a9b9d4c322c7","contentSize":"2224","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/Z8L832"},{"@type":"cr:FileObject","@id":"plot/Figure10/prefecture-shapefile/CN-shi-A.dbf","name":"CN-shi-A.dbf","encodingFormat":"application/dbf","md5":"402c8722d91dde1e29aa40641b915931","contentSize":"2843482","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/TEKVZP"},{"@type":"cr:FileObject","@id":"plot/Figure10/prefecture-shapefile/CN-shi-A.prj","name":"CN-shi-A.prj","encodingFormat":"application/prj","md5":"c7511977f2124a85517a0efb6d6ba6ed","contentSize":"437","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/EE9TZ7"},{"@type":"cr:FileObject","@id":"plot/Figure10/prefecture-shapefile/CN-shi-A.sbn","name":"CN-shi-A.sbn","encodingFormat":"application/sbn","md5":"495ee3c5eef7fc9c8da89bcc3d45604e","contentSize":"46764","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/ZQNCUV"},{"@type":"cr:FileObject","@id":"plot/Figure10/prefecture-shapefile/CN-shi-A.sbx","name":"CN-shi-A.sbx","encodingFormat":"application/sbx","md5":"c078f5504aa4d038a0982f565cb3eb5a","contentSize":"1580","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/L94OZX"},{"@type":"cr:FileObject","@id":"plot/Figure10/prefecture-shapefile/CN-shi-A.shp","name":"CN-shi-A.shp","encodingFormat":"application/shp","md5":"5e339a2fdb57e719e37fffdf3196c593","contentSize":"53346880","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/KHFNN8"},{"@type":"cr:FileObject","@id":"plot/Figure10/prefecture-shapefile/CN-shi-A.shx","name":"CN-shi-A.shx","encodingFormat":"application/shx","md5":"6b421c2c4bb275c31e863325eddfff0e","contentSize":"39316","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/PMP7JB"},{"@type":"cr:FileObject","@id":"plot/Figure11/CASM_divide_irrelevant.R","name":"CASM_divide_irrelevant.R","encodingFormat":"type/x-r-syntax","md5":"024675ef262d5d3504a2c3b5cae23f1b","contentSize":"2931","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/KUZI9Z"},{"@type":"cr:FileObject","@id":"plot/Figure11/keyword_search_placebo_count.csv","name":"keyword_search_placebo_count.csv","encodingFormat":"text/csv","md5":"d31725a44ca9132413c032e814248f66","contentSize":"10852","description":"Also used for plot/SuppFigure7","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/XTYK7N&format=original"},{"@type":"cr:FileObject","@id":"plot/Figure12/CASM_Wickedonna.R","name":"CASM_Wickedonna.R","encodingFormat":"type/x-r-syntax","md5":"e531b8138c1eaafe1c332e7b759a4d5b","contentSize":"3213","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/TBCYRV"},{"@type":"cr:FileObject","@id":"plot/Figure12/wicked_events_2018-11-29.csv","name":"wicked_events_2018-11-29.csv","encodingFormat":"text/csv","md5":"22b58602dfae2302e77dab00417536c6","contentSize":"13534829","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/XWCHD8"},{"@type":"cr:FileObject","@id":"plot/Figure4/firststage_c1_text_image_precision_recall.pdf","name":"firststage_c1_text_image_precision_recall.pdf","encodingFormat":"application/pdf","md5":"5f48c1bd72e4fd94dc85d2795d98770e","contentSize":"22550","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/DHHQMW"},{"@type":"cr:FileObject","@id":"plot/Figure4/firststage_c1_text_image_precision_recall.r","name":"firststage_c1_text_image_precision_recall.r","encodingFormat":"type/x-r-syntax","md5":"6ae0971a2bbbbcf91a444e518abd6a68","contentSize":"1581","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/F8IEN1"},{"@type":"cr:FileObject","@id":"plot/Figure4/firststage_c1_text_image_precision_recall.csv","name":"firststage_c1_text_image_precision_recall.csv","encodingFormat":"text/csv","md5":"bc1da5793f751857e85d2fd7310daa9c","contentSize":"289041","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/3XDMXX&format=original"},{"@type":"cr:FileObject","@id":"plot/Figure9/c1c2.csv","name":"c1c2.csv","encodingFormat":"text/csv","md5":"2cd4954991fbbe3a3ffb1f9ba48c953c","contentSize":"137767","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/SQI0WJ&format=original"},{"@type":"cr:FileObject","@id":"plot/Figure9/c1c2_precision_recall_crossvalidation.csv","name":"c1c2_precision_recall_crossvalidation.csv","encodingFormat":"text/csv","md5":"7a9c0483c528de29ade20a8873bed0af","contentSize":"339954","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/5HYIZN&format=original"},{"@type":"cr:FileObject","@id":"plot/Figure9/c1c2_vs_c1_precision_recall.pdf","name":"c1c2_vs_c1_precision_recall.pdf","encodingFormat":"application/pdf","md5":"bfecec42df5710dda4aa17fcea5b22b0","contentSize":"13934","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/QLTY5H"},{"@type":"cr:FileObject","@id":"plot/Figure9/c1c2_vs_c1_precision_recall.r","name":"c1c2_vs_c1_precision_recall.r","encodingFormat":"type/x-r-syntax","md5":"cfc6eea21f4c63541e9fffab937761c1","contentSize":"2655","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/DIQQRJ"},{"@type":"cr:FileObject","@id":"plot/Figure9/c1c2_vs_cross_validation_precision_recall.pdf","name":"c1c2_vs_cross_validation_precision_recall.pdf","encodingFormat":"application/pdf","md5":"e17b4de9c43f5208415474019e28a1e9","contentSize":"29291","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/R23RHQ"},{"@type":"cr:FileObject","@id":"plot/Figure9/c1c2_vs_cross_validation_precision_recall.r","name":"c1c2_vs_cross_validation_precision_recall.r","encodingFormat":"type/x-r-syntax","md5":"12a6a54194073b019f1270d53cc16933","contentSize":"2484","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/KTSBBO"},{"@type":"cr:FileObject","@id":"plot/Figure9/secondstage_c2_text_image_precision_recall.csv","name":"secondstage_c2_text_image_precision_recall.csv","encodingFormat":"text/csv","md5":"34e97e1821b937d2251eba38fbe1e50c","contentSize":"279984","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/LG7CMY&format=original"},{"@type":"cr:FileObject","@id":"plot/SuppFigure1/keywordCoverageSet.txt","name":"keywordCoverageSet.txt","encodingFormat":"text/plain","md5":"adf7c92cd57d834d30666de8c7e335c7","contentSize":"25990","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/MP3NXZ"},{"@type":"cr:FileObject","@id":"plot/SuppFigure1/keyword_coverage_wickedonna.pdf","name":"keyword_coverage_wickedonna.pdf","encodingFormat":"application/pdf","md5":"c95becba98db961b628827e25b97d229","contentSize":"11877","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/XNYN9C"},{"@type":"cr:FileObject","@id":"plot/SuppFigure1/supfig1.r","name":"supfig1.r","encodingFormat":"type/x-r-syntax","md5":"cbd27b23784f264b3ba64167a9ae2389","contentSize":"895","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/N9RBY0"},{"@type":"cr:FileObject","@id":"plot/SuppFigure2/keywordCoverageSet_keyword_year.txt","name":"keywordCoverageSet_keyword_year.txt","encodingFormat":"text/plain","md5":"61e2e139963b69b2fe26f0d248654ea8","contentSize":"114914","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/4XJUWL"},{"@type":"cr:FileObject","@id":"plot/SuppFigure2/keyword_coverage_wickedonna_by_year.pdf","name":"keyword_coverage_wickedonna_by_year.pdf","encodingFormat":"application/pdf","md5":"dd30ac6a555cd2fc6416ab51b23fdfc1","contentSize":"208090","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/WF2ENR"},{"@type":"cr:FileObject","@id":"plot/SuppFigure2/supfig2.r","name":"supfig2.r","encodingFormat":"type/x-r-syntax","md5":"45627cfc9155b2a0b536b4afeb9c6686","contentSize":"1015","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/2VBTRT"},{"@type":"cr:FileObject","@id":"plot/SuppFigure3/keywordCoverageSet_keyword_prov.txt","name":"keywordCoverageSet_keyword_prov.txt","encodingFormat":"text/plain","md5":"54a843cee1db484d9f56fff0878ab37e","contentSize":"837160","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/QNRESH"},{"@type":"cr:FileObject","@id":"plot/SuppFigure3/keyword_coverage_wickedonna_by_province.pdf","name":"keyword_coverage_wickedonna_by_province.pdf","encodingFormat":"application/pdf","md5":"ac197a6c75bac3664fa9477dc481c738","contentSize":"346989","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/2MNTVF"},{"@type":"cr:FileObject","@id":"plot/SuppFigure3/supfig3.r","name":"supfig3.r","encodingFormat":"type/x-r-syntax","md5":"1a08e1f8db1a7f84b0ef8d42a3ae734c","contentSize":"1613","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/0IAU94"},{"@type":"cr:FileObject","@id":"plot/SuppFigure4/keyword_vs_num_event_700000.pdf","name":"keyword_vs_num_event_700000.pdf","encodingFormat":"application/pdf","md5":"ba7e6a138603a6cc2aac4f1bc6f83b53","contentSize":"13515","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/IEG4YX"},{"@type":"cr:FileObject","@id":"plot/SuppFigure4/keyword_vs_num_event_700000_fig4.csv","name":"keyword_vs_num_event_700000_fig4.csv","encodingFormat":"text/csv","md5":"432279f6a13ec42eef027d68f77f0463","contentSize":"69109","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/JA9YXG&format=original"},{"@type":"cr:FileObject","@id":"plot/SuppFigure4/supfig4.r","name":"supfig4.r","encodingFormat":"type/x-r-syntax","md5":"38fec215de1bdf7f0a69aa76fba1dcc4","contentSize":"2565","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/SPJSDH"},{"@type":"cr:FileObject","@id":"plot/SuppFigure5/precision_vs_keyword.pdf","name":"precision_vs_keyword.pdf","encodingFormat":"application/pdf","md5":"0bf3a511cbb4809313893b4bf48c8c3b","contentSize":"19190","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/2VJNBB"},{"@type":"cr:FileObject","@id":"plot/SuppFigure5/precision_vs_keyword.csv","name":"precision_vs_keyword.csv","encodingFormat":"text/csv","md5":"7446a32d847a9bc881e9cb3d72a323df","contentSize":"104588","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/FF11SU&format=original"},{"@type":"cr:FileObject","@id":"plot/SuppFigure5/supfig5.r","name":"supfig5.r","encodingFormat":"type/x-r-syntax","md5":"ea64daf3d326d7d256f2c656c276bfc0","contentSize":"945","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/GJL5BL"},{"@type":"cr:FileObject","@id":"plot/SuppFigure6/firststage_c1_SVM_NB.csv","name":"firststage_c1_SVM_NB.csv","encodingFormat":"text/csv","md5":"edd1148369654c35dec40a81dec63a6a","contentSize":"263546","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/MRSZWA&format=original"},{"@type":"cr:FileObject","@id":"plot/SuppFigure6/firststage_c1_SVM_NB_precision_recall.pdf","name":"firststage_c1_SVM_NB_precision_recall.pdf","encodingFormat":"application/pdf","md5":"7a3df83b0994e9794ab0949a23668ec9","contentSize":"17609","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/LMSRVZ"},{"@type":"cr:FileObject","@id":"plot/SuppFigure6/supfig6.r","name":"supfig6.r","encodingFormat":"type/x-r-syntax","md5":"015f173bbe04cf556ac60627bc026f20","contentSize":"1607","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/ZW97UQ"},{"@type":"cr:FileObject","@id":"plot/SuppFigure7/CASM_keyword_irrelevant_count.pdf","name":"CASM_keyword_irrelevant_count.pdf","encodingFormat":"application/pdf","md5":"b92f76c8836017e0eedc3d76875c2474","contentSize":"14892","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/TGD7MK"},{"@type":"cr:FileObject","@id":"plot/SuppFigure7/supfig7.R","name":"supfig7.R","encodingFormat":"type/x-r-syntax","md5":"aa0f15068a607a01d12c1b815271f07d","contentSize":"3177","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/P6WSSE"},{"@type":"cr:FileObject","@id":"supporting/high_frequency_protest_words.txt","name":"high_frequency_protest_words.txt","encodingFormat":"text/plain","md5":"8221df85c452eaa8eae8b2da0970d6de","contentSize":"7611","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/F2TSZO"},{"@type":"cr:FileObject","@id":"supporting/jieba.dict.big.txt","name":"jieba.dict.big.txt","encodingFormat":"text/plain","md5":"62a9df455d0ee5881f099725db8d9d01","contentSize":"8583143","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/FTLWDW"},{"@type":"cr:FileObject","@id":"supporting/propaganda_media_words.txt","name":"propaganda_media_words.txt","encodingFormat":"text/plain","md5":"a1bc6a08f09bc7f2cf91d7ea878dc5c5","contentSize":"509","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/UKIOWE"},{"@type":"cr:FileObject","@id":"supporting/stopwords1.txt","name":"stopwords1.txt","encodingFormat":"text/plain","md5":"6d1f0322d729d9bb02a7cd98386cbba9","contentSize":"33171","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/6BUBZP"},{"@type":"cr:FileObject","@id":"supporting/village_level_dict.txt","name":"village_level_dict.txt","encodingFormat":"text/plain","md5":"4a55542530269ea1ff9f7cf30ae79d00","contentSize":"1003403","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/NZCHXT"},{"@type":"cr:FileObject","@id":"supporting/village_level_dict_reversed.txt","name":"village_level_dict_reversed.txt","encodingFormat":"text/plain","md5":"7bcca52a4fdb6b74c53f35802659e4a7","contentSize":"927873","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/DE0AZD"},{"@type":"cr:FileObject","@id":"supporting/vocab_pos_grievance.dict","name":"vocab_pos_grievance.dict","encodingFormat":"application/octet-stream","md5":"931671245e4ea9bba1037ea4b79f706c","contentSize":"2542865","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/D7XPL0"},{"@type":"cr:FileObject","@id":"supporting/vocab_pos_KGP_50000.dict","name":"vocab_pos_KGP_50000.dict","encodingFormat":"application/octet-stream","md5":"a947231c58e88a707d811d19f84dff88","contentSize":"1225912","description":"","contentUrl":"https://dataverse.harvard.edu/api/access/datafile/:persistentId?persistentId=doi:10.7910/DVN/SS4LNN/8H7TJ8"}],"recordSet":[{"@type":"cr:RecordSet","field":[{"@type":"cr:Field","name":"event_id\tforms\tissues","description":"event_id\tforms\tissues","dataType":"sc:Text","source":{"@id":"19871920","fileObject":{"@id":"output/protest_events.csv"},"extract":{"column":"event_id\tforms\tissues"}}}]},{"@type":"cr:RecordSet","field":[{"@type":"cr:Field","name":"month\tcount_all\tmonth_numeric\tquarter\tDataset\tyear","description":"month\tcount_all\tmonth_numeric\tquarter\tDataset\tyear","dataType":"sc:Text","source":{"@id":"19871943","fileObject":{"@id":"plot/Figure11/keyword_search_placebo_count.csv"},"extract":{"column":"month\tcount_all\tmonth_numeric\tquarter\tDataset\tyear"}}}]},{"@type":"cr:RecordSet","field":[{"@type":"cr:Field","name":"label","description":"label","dataType":"sc:Text","source":{"@id":"19871936","fileObject":{"@id":"plot/Figure4/firststage_c1_text_image_precision_recall.csv"},"extract":{"column":"label"}}},{"@type":"cr:Field","name":"precision","description":"precision","dataType":"sc:Float","source":{"@id":"19871935","fileObject":{"@id":"plot/Figure4/firststage_c1_text_image_precision_recall.csv"},"extract":{"column":"precision"}}},{"@type":"cr:Field","name":"recall","description":"recall","dataType":"sc:Float","source":{"@id":"19871934","fileObject":{"@id":"plot/Figure4/firststage_c1_text_image_precision_recall.csv"},"extract":{"column":"recall"}}}]},{"@type":"cr:RecordSet","field":[{"@type":"cr:Field","name":"label","description":"label","dataType":"sc:Text","source":{"@id":"19871923","fileObject":{"@id":"plot/Figure9/c1c2.csv"},"extract":{"column":"label"}}},{"@type":"cr:Field","name":"precision","description":"precision","dataType":"sc:Float","source":{"@id":"19871921","fileObject":{"@id":"plot/Figure9/c1c2.csv"},"extract":{"column":"precision"}}},{"@type":"cr:Field","name":"recall","description":"recall","dataType":"sc:Float","source":{"@id":"19871922","fileObject":{"@id":"plot/Figure9/c1c2.csv"},"extract":{"column":"recall"}}}]},{"@type":"cr:RecordSet","field":[{"@type":"cr:Field","name":"label","description":"label","dataType":"sc:Text","source":{"@id":"19871928","fileObject":{"@id":"plot/Figure9/c1c2_precision_recall_crossvalidation.csv"},"extract":{"column":"label"}}},{"@type":"cr:Field","name":"precision","description":"precision","dataType":"sc:Float","source":{"@id":"19871929","fileObject":{"@id":"plot/Figure9/c1c2_precision_recall_crossvalidation.csv"},"extract":{"column":"precision"}}},{"@type":"cr:Field","name":"recall","description":"recall","dataType":"sc:Float","source":{"@id":"19871930","fileObject":{"@id":"plot/Figure9/c1c2_precision_recall_crossvalidation.csv"},"extract":{"column":"recall"}}}]},{"@type":"cr:RecordSet","field":[{"@type":"cr:Field","name":"label","description":"label","dataType":"sc:Text","source":{"@id":"19871925","fileObject":{"@id":"plot/Figure9/secondstage_c2_text_image_precision_recall.csv"},"extract":{"column":"label"}}},{"@type":"cr:Field","name":"precision","description":"precision","dataType":"sc:Float","source":{"@id":"19871927","fileObject":{"@id":"plot/Figure9/secondstage_c2_text_image_precision_recall.csv"},"extract":{"column":"precision"}}},{"@type":"cr:Field","name":"recall","description":"recall","dataType":"sc:Float","source":{"@id":"19871924","fileObject":{"@id":"plot/Figure9/secondstage_c2_text_image_precision_recall.csv"},"extract":{"column":"recall"}}},{"@type":"cr:Field","name":"threshold","description":"threshold","dataType":"sc:Float","source":{"@id":"19871926","fileObject":{"@id":"plot/Figure9/secondstage_c2_text_image_precision_recall.csv"},"extract":{"column":"threshold"}}}]},{"@type":"cr:RecordSet","field":[{"@type":"cr:Field","name":"month","description":"month","dataType":"sc:Text","source":{"@id":"19871931","fileObject":{"@id":"plot/SuppFigure4/keyword_vs_num_event_700000_fig4.csv"},"extract":{"column":"month"}}},{"@type":"cr:Field","name":"nunique","description":"nunique","dataType":"sc:Integer","source":{"@id":"19871933","fileObject":{"@id":"plot/SuppFigure4/keyword_vs_num_event_700000_fig4.csv"},"extract":{"column":"nunique"}}},{"@type":"cr:Field","name":"rank","description":"rank","dataType":"sc:Integer","source":{"@id":"19871932","fileObject":{"@id":"plot/SuppFigure4/keyword_vs_num_event_700000_fig4.csv"},"extract":{"column":"rank"}}}]},{"@type":"cr:RecordSet","field":[{"@type":"cr:Field","name":"precision","description":"precision","dataType":"sc:Float","source":{"@id":"19871938","fileObject":{"@id":"plot/SuppFigure5/precision_vs_keyword.csv"},"extract":{"column":"precision"}}},{"@type":"cr:Field","name":"rank","description":"rank","dataType":"sc:Integer","source":{"@id":"19871937","fileObject":{"@id":"plot/SuppFigure5/precision_vs_keyword.csv"},"extract":{"column":"rank"}}},{"@type":"cr:Field","name":"recall","description":"recall","dataType":"sc:Float","source":{"@id":"19871939","fileObject":{"@id":"plot/SuppFigure5/precision_vs_keyword.csv"},"extract":{"column":"recall"}}}]},{"@type":"cr:RecordSet","field":[{"@type":"cr:Field","name":"label","description":"label","dataType":"sc:Text","source":{"@id":"19871940","fileObject":{"@id":"plot/SuppFigure6/firststage_c1_SVM_NB.csv"},"extract":{"column":"label"}}},{"@type":"cr:Field","name":"precision","description":"precision","dataType":"sc:Float","source":{"@id":"19871941","fileObject":{"@id":"plot/SuppFigure6/firststage_c1_SVM_NB.csv"},"extract":{"column":"precision"}}},{"@type":"cr:Field","name":"recall","description":"recall","dataType":"sc:Float","source":{"@id":"19871942","fileObject":{"@id":"plot/SuppFigure6/firststage_c1_SVM_NB.csv"},"extract":{"column":"recall"}}}]}]}