SINAI/SFU-Review-SP-Neg
数据集概述
数据集名称: SFU-Review-SP-Neg
语言: 西班牙语 (es)
标签: 否定
数据文件配置:
- 默认配置:
- 分割: 汽车 (coches)
- 路径: SFU_Review_SP_NEG_cue_scope_event_with_dependency_info_CoNLL/coches.txt
- 分割: 酒店 (hoteles)
- 路径: SFU_Review_SP_NEG_cue_scope_event_with_dependency_info_CoNLL/hoteles.txt
- 分割: 洗衣机 (lavadoras)
- 路径: SFU_Review_SP_NEG_cue_scope_event_with_dependency_info_CoNLL/lavadoras.txt
- 分割: 书籍 (libros)
- 路径: SFU_Review_SP_NEG_cue_scope_event_with_dependency_info_CoNLL/libros.txt
- 分割: 手机 (moviles)
- 路径: SFU_Review_SP_NEG_cue_scope_event_with_dependency_info_CoNLL/moviles.txt
- 分割: 音乐 (musica)
- 路径: SFU_Review_SP_NEG_cue_scope_event_with_dependency_info_CoNLL/musica.txt
- 分割: 电脑 (ordenadores)
- 路径: SFU_Review_SP_NEG_cue_scope_event_with_dependency_info_CoNLL/ordenadores.txt
- 分割: 电影 (peliculas)
- 路径: SFU_Review_SP_NEG_cue_scope_event_with_dependency_info_CoNLL/peliculas.txt
- 分割: 汽车 (coches)
数据集描述:
- 内容: 包含400篇来自Ciao.es网站的评论,涵盖汽车、酒店、洗衣机、书籍、手机、音乐、电脑和电影等8个领域。每个领域包含25篇正面和25篇负面评论。
- 注释: 每篇评论在词级别标注词元(lemma)和词性,在句子级别标注否定关键词(否定提示词)、其辖域(scope)、事件,以及否定如何影响句子极性(是否改变极性或增加/减少其值),同时考虑强化词和弱化词。
许可证: CC-BY-NC-SA-4.0
引用信息: bibtex
@article{article,
  author  = {Jiménez-Zafra, Salud María and Taulé, Mariona and Martín-Valdivia, M. Teresa and Ureña-López, L. Alfonso and Martí, M. Antónia},
  title   = {{SFU} {ReviewSP-NEG}: a {Spanish} corpus annotated with negation for sentiment analysis. {A} typology of negation patterns},
  journal = {Language Resources and Evaluation},
  volume  = {52},
  pages   = {1--37},
  year    = {2018},
  month   = jun,
  doi     = {10.1007/s10579-017-9391-x}
}
bibtex
@article{Jiménez-Zafra2018240,
  author            = {Jiménez-Zafra, Salud María and Martín-Valdivia, M. Teresa and Molina-González, M. Dolores and Ureña-López, L. Alfonso},
  title             = {Relevance of the {SFU} {ReviewSP-NEG} corpus annotated with the scope of negation for supervised polarity classification in {Spanish}},
  journal           = {Information Processing and Management},
  volume            = {54},
  number            = {2},
  pages             = {240--251},
  year              = {2018},
  doi               = {10.1016/j.ipm.2017.11.007},
  url               = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85036470241&doi=10.1016%2fj.ipm.2017.11.007&partnerID=40&md5=ab1b45f84f48a0307ef6d0412de3e6a6},
  type              = {Article},
  publication_stage = {Final},
  source            = {Scopus}
}
bibtex
@inproceedings{jimenez-zafra-etal-2016-problematic,
    title = "Problematic Cases in the Annotation of Negation in {S}panish",
    author = "Jim{\'e}nez-Zafra, Salud Mar{\'\i}a and Martin, Maite and Ure{\~n}a-L{\'o}pez, L. Alfonso and Mart{\'\i}, Toni and Taul{\'e}, Mariona",
    editor = "Blanco, Eduardo and Morante, Roser and Saur{\'\i}, Roser",
    booktitle = "Proceedings of the Workshop on Extra-Propositional Aspects of Meaning in Computational Linguistics ({E}x{P}ro{M})",
    month = dec,
    year = "2016",
    address = "Osaka, Japan",
    publisher = "The COLING 2016 Organizing Committee",
    url = "https://aclanthology.org/W16-5006",
    pages = "42--48",
    abstract = "This paper presents the main sources of disagreement found during the annotation of the Spanish SFU Review Corpus with negation (SFU ReviewSP -NEG). Negation detection is a challenge in most of the task related to NLP, so the availability of corpora annotated with this phenomenon is essential in order to advance in tasks related to this area. A thorough analysis of the problems found during the annotation could help in the study of this phenomenon.",
}
bibtex
@article{PLN5335,
  author   = {Martí, M. Antónia and Martín-Valdivia, M. Teresa and Taulé, Mariona and Jiménez-Zafra, Salud María and Nofre, Montserrat and Marsó, Laia},
  title    = {La negación en español: análisis y tipología de patrones de negación},
  journal  = {Procesamiento del Lenguaje Natural},
  volume   = {57},
  number   = {0},
  pages    = {41--48},
  year     = {2016},
  issn     = {1989-7553},
  url      = {http://journal.sepln.org/sepln/ojs/ojs/index.php/pln/article/view/5335},
  abstract = {En este artículo se presentan los criterios aplicados para la anotación del corpus SFU ReviewSP-NEG con negación y la tipología lingüística correspondiente. Esta tipología presenta la ventaja de ser fácilmente expresable en términos de un tagset para la anotación de corpus, de presentar tipos claramente delimitados, evitando así la ambigüedad en el proceso de anotación, y de presentar una amplia cobertura, es decir, que ha servido para resolver todos los casos que han aparecido. El corpus contiene 400 comentarios y 198.551 palabras. Actualmente está anotado en un 75\% y, de un total de 6.331 oraciones revisadas, se han identificado 2.953 estructuras de negación.}
}



