Name: Terraa/vis-desc-large
Creator: Terraa
Published: 2026-02-28 18:44:51
License: cc-by-sa-4.0

下载链接：

https://hf-mirror.com/datasets/Terraa/vis-desc-large

下载链接

链接失效反馈

官方服务：

资源简介：

---
license: cc-by-sa-4.0
task_categories:
- text-classification
language:
- en
size_categories:
- 10K<n<100K
---

100k segments of 60-500 characters heuristically labeled for evaluation of visual descriptiveness.

Segments were sampled from:

```markdown
| **Name** | **Description** | **Scores** | **#** |
|-----------------------------------|------------------------------------------|-------------|--------|
| flickr-megalith internlm2 | LLM-generated image captions | 5 | 15k |
| flickr-megalith internlm2-short | LLM-generated image captions | 4 | 15k |
| flickr30k | crowdsourced image captions | 2, 3, 4 | 15k |
| MS COCO | crowdsourced image captions | 1, 2, 3 | 5k |
| SBU Captions | raw Flickr image captions | 1, 2, 3 | 5k |
| CMU Movie Summary Corpus | movie summaries | 1, 2, 3 | 5k |
| CMU Book Summary Dataset | book summaries | 1, 2, 3 | 5k |
| gutenberg-dialog | book dialogues | 0, 1, 2 | 5k |
| wikitext | Wikipedia articles | 0, 1, 2 | 10k |
| xsum | news articles | 0, 1, 2 | 5k |
| tripadvisor-hotel-reviews | hotel reviews | 0, 1, 2 | 2k |
| yelp-review-full | Yelp reviews | 0, 1, 2 | 3k |
| scientific-papers | scientific papers from ArXiv | 0, 1 | 5k |
| Amazon Reviews 2023 | Amazon reviews | 0, 1 | 5k |
```

## Citations

```bibtex
@comment{
  One entry per source corpus in the table above; citation keys are stable.
  arXiv-only works are @misc with eprint/archiveprefix; conference papers are
  @inproceedings with the proceedings title in booktitle.
}

@misc{flickr10m,
  author       = {{Caption Emporium}},
  title        = {flickr-megalith-10m-internvl2-multi-caption},
  year         = {2024},
  publisher    = {Hugging Face},
  howpublished = {Hugging Face dataset repository},
  url          = {https://huggingface.co/datasets/CaptionEmporium/flickr-megalith-10m-internvl2-multi-caption},
}

@article{flickr30k,
  author  = {Young, Peter and Lai, Alice and Hodosh, Micah and Hockenmaier, Julia},
  title   = {From image descriptions to visual denotations: New similarity metrics for semantic inference over event descriptions},
  journal = {Transactions of the Association for Computational Linguistics},
  volume  = {2},
  pages   = {67--78},
  year    = {2014},
  doi     = {10.1162/tacl_a_00166},
}

@misc{mscoco,
  author        = {Lin, Tsung-Yi and Maire, Michael and Belongie, Serge and Bourdev, Lubomir and Girshick, Ross and Hays, James and Perona, Pietro and Ramanan, Deva and Zitnick, C. Lawrence and Doll{\'a}r, Piotr},
  title         = {{Microsoft} {COCO}: Common Objects in Context},
  year          = {2014},
  month         = may,
  eprint        = {1405.0312},
  archiveprefix = {arXiv},
  doi           = {10.48550/arXiv.1405.0312},
}

@inproceedings{im2text,
  author    = {Ordonez, Vicente and Kulkarni, Girish and Berg, Tamara},
  title     = {{Im2Text}: Describing Images Using 1 Million Captioned Photographs},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Shawe-Taylor, J. and Zemel, R. and Bartlett, P. and Pereira, F. and Weinberger, K. Q.},
  volume    = {24},
  publisher = {Curran Associates, Inc.},
  year      = {2011},
  url       = {https://proceedings.neurips.cc/paper/2011/file/5dd9db5e033da9c6fb5ba83c7a7ebea9-Paper.pdf},
}

@inproceedings{movie-summaries,
  author    = {Bamman, David and O'Connor, Brendan and Smith, Noah A.},
  title     = {Learning Latent Personas of Film Characters},
  booktitle = {Proceedings of the 51st Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)},
  pages     = {352--361},
  publisher = {Association for Computational Linguistics},
  year      = {2013},
  month     = aug,
  url       = {https://aclanthology.org/P13-1035},
}

@misc{book-summaries,
  author        = {Bamman, David and Smith, Noah A.},
  title         = {New Alignment Methods for Discriminative Book Summarization},
  year          = {2013},
  month         = may,
  eprint        = {1305.1319},
  archiveprefix = {arXiv},
  doi           = {10.48550/arXiv.1305.1319},
}

@inproceedings{gutenberg-dialogues,
  author    = {Cs{\'a}ky, Rich{\'a}rd and Recski, G{\'a}bor},
  title     = {The {Gutenberg} Dialogue Dataset},
  booktitle = {Proceedings of the 16th Conference of the European Chapter of the Association for Computational Linguistics},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  month     = apr,
  url       = {https://arxiv.org/abs/2004.12752},
}

@misc{wikitext,
  author        = {Merity, Stephen and Xiong, Caiming and Bradbury, James and Socher, Richard},
  title         = {Pointer Sentinel Mixture Models},
  year          = {2016},
  month         = sep,
  eprint        = {1609.07843},
  archiveprefix = {arXiv},
  doi           = {10.48550/arXiv.1609.07843},
  urldate       = {2025-11-15},
}

@misc{xsum,
  author        = {Narayan, Shashi and Cohen, Shay B. and Lapata, Mirella},
  title         = {Don't Give Me the Details, Just the Summary! {Topic}-Aware Convolutional Neural Networks for Extreme Summarization},
  year          = {2018},
  eprint        = {1808.08745},
  archiveprefix = {arXiv},
}

@article{hotel-reviews,
  author    = {Alam, {\relax Md}. Hijbul and Ryu, Woo-Jong and Lee, SangKeun},
  title     = {Joint Multi-grain Topic Sentiment: Modeling Semantic Aspects for Online Reviews},
  journal   = {Information Sciences},
  volume    = {339},
  publisher = {Elsevier BV},
  year      = {2016},
  month     = jan,
  issn      = {0020-0255},
  doi       = {10.1016/j.ins.2016.01.013},
}

@inproceedings{yelp-reviews,
  author    = {Zhang, Xiang and Zhao, Junbo and LeCun, Yann},
  title     = {Character-level Convolutional Networks for Text Classification},
  booktitle = {Advances in Neural Information Processing Systems},
  volume    = {28},
  year      = {2015},
  url       = {https://papers.nips.cc/paper_files/paper/2015/hash/250cf8b51c773f3f8dc8b4be867a9a02-Abstract.html},
}

@inproceedings{scientific-papers,
  author    = {Cohan, Arman and Dernoncourt, Franck and Kim, Doo Soon and Bui, Trung and Kim, Seokhwan and Chang, Walter and Goharian, Nazli},
  title     = {A Discourse-Aware Attention Model for Abstractive Summarization of Long Documents},
  booktitle = {Proceedings of the 2018 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 2 (Short Papers)},
  publisher = {Association for Computational Linguistics},
  year      = {2018},
  doi       = {10.18653/v1/n18-2097},
}

@misc{amazon-reviews,
  author        = {Hou, Yupeng and Li, Jiacheng and He, Zhankui and Yan, An and Chen, Xiusi and McAuley, Julian},
  title         = {Bridging Language and Items for Retrieval and Recommendation},
  year          = {2024},
  eprint        = {2403.03952},
  archiveprefix = {arXiv},
}
```

应用场景：