diff --git a/110-PT-BN-KP.zip b/110-PT-BN-KP.zip deleted file mode 100644 index c5dd91f..0000000 Binary files a/110-PT-BN-KP.zip and /dev/null differ diff --git a/500N-KPCrowd-v1.2.zip b/500N-KPCrowd-v1.2.zip deleted file mode 100644 index 66952c3..0000000 Binary files a/500N-KPCrowd-v1.2.zip and /dev/null differ diff --git a/README b/README index 4281e4c..82dd7ad 100644 --- a/README +++ b/README @@ -5,8 +5,6 @@ This repository contains the datasets for automatic keyphrase extraction task. FILES -* 500N-KPCrowd.zip data from Marujo:LREC2012 (News articles annotated using AMT) -* 110-PT-BN-KP.zip data from Marujo:Interspeech2011 (non-English AKE corpus) * MAUI.tar.gz data from University of Waikato (KEA, MAUI systems) * Wan2008.tar.gz data from Wan:2008 * Schutz2008.tar.gz data from Schutz:2008 (only answer sets and readme are provided. the papers are available at ftp://ftp.ncbi.nlm.nih.gov/pub/pmc/articles.tar.gz) @@ -15,25 +13,6 @@ FILES BIBLIOGRAPHY -@InProceedings{Marujo:LREC2012, - Author = {Luis Marujo and Anatole Gershman and Jaime Carbonell and Robert Frederking and Jo\~{a}o P. Neto}, - Booktitle = {Proceedings of LREC 2012}, - Title = {Supervised Topical Key Phrase Extraction of News Stories using Crowdsourcing, Light Filtering and Co-reference Normalization}, - location = {Istanbul, Turkey}, - publisher = {ELRA}, - Year = {2012} -} - -@InProceedings{Marujo:Interspeech2011, - author = {Luis Marujo and M\'{a}rcio Viveiros and Jo\~{a}o P. Neto}, - title = {{Keyphrase Cloud Generation of Broadcast News}}, - booktitle = {Proceedings of Interspeech 2011}, - publisher = {ISCA}, - location = {Florence, Italy}, - year = {2011}, - month = {September} -} - @InProceedings{Wan:2008, author = {Xiaojun Wan and Jianguo Xiao}, title = {CollabRank: Towards a Collaborative Approach to Single-Document Keyphrase Extraction},