% NOTE(review): the same three citation keys are defined again under the
% "Citation" heading later in this file. BibTeX/Biber report repeated entries,
% so keep only one copy when extracting a .bib file from this page.

% RLHF-V preprint. The arXiv identifier lives in eprint/archivePrefix/url
% instead of being embedded in a journal field.
@misc{yu2023rlhf,
  title         = {{RLHF-V}: Towards Trustworthy {MLLMs} via Behavior Alignment from Fine-grained Correctional Human Feedback},
  author        = {Yu, Tianyu and Yao, Yuan and Zhang, Haoye and He, Taiwen and Han, Yifeng and Cui, Ganqu and Hu, Jinyi and Liu, Zhiyuan and Zheng, Hai-Tao and Sun, Maosong and others},
  year          = {2023},
  eprint        = {2312.00849},
  archivePrefix = {arXiv},
  url           = {https://arxiv.org/abs/2312.00849},
}

% RLAIF-V preprint. Acronyms in the title are brace-protected so that
% sentence-casing styles do not lowercase them.
@misc{yu2024rlaifv,
  title         = {{RLAIF-V}: Open-Source {AI} Feedback Leads to Super {GPT-4V} Trustworthiness},
  author        = {Yu, Tianyu and Zhang, Haoye and Li, Qiming and Xu, Qixin and Yao, Yuan and Chen, Da and Lu, Xiaoman and Cui, Ganqu and Dang, Yunkai and He, Taiwen and Feng, Xiaocheng and Song, Jun and Zheng, Bo and Liu, Zhiyuan and Chua, Tat-Seng and Sun, Maosong},
  year          = {2024},
  eprint        = {2405.17220},
  archivePrefix = {arXiv},
  url           = {https://arxiv.org/abs/2405.17220},
}

% MiniCPM-V 4.5 preprint. The model name and acronym in the title are
% brace-protected against style recasing.
@misc{yu2025minicpmv45cookingefficient,
  title         = {{MiniCPM-V} 4.5: Cooking Efficient {MLLMs} via Architecture, Data, and Training Recipe},
  author        = {Yu, Tianyu and Wang, Zefan and Wang, Chongyi and Huang, Fuwei and Ma, Wenshuo and He, Zhihui and Cai, Tianchi and Chen, Weize and Huang, Yuxiang and Zhao, Yuanqian and Xu, Bokai and Cui, Junbo and Xu, Yingjing and Ruan, Liqing and Zhang, Luoyuan and Liu, Hanyu and Tang, Jingkun and Liu, Hongyuan and Guo, Qining and Hu, Wenhao and He, Bingxiang and Zhou, Jie and Cai, Jie and Qi, Ji and Guo, Zonghao and Chen, Chi and Zeng, Guoyang and Li, Yuxuan and Cui, Ganqu and Ding, Ning and Han, Xu and Yao, Yuan and Liu, Zhiyuan and Sun, Maosong},
  year          = {2025},
  eprint        = {2509.18154},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
  url           = {https://arxiv.org/abs/2509.18154},
}

Date

2 years ago

Size

11.77 GB

Organization

Paper URL

arxiv.org

Citation

% RLHF-V preprint. The arXiv identifier lives in eprint/archivePrefix/url
% instead of being embedded in a journal field; title capitalisation is
% restored and the acronyms are brace-protected against style recasing.
@misc{yu2023rlhf,
  title         = {{RLHF-V}: Towards Trustworthy {MLLMs} via Behavior Alignment from Fine-grained Correctional Human Feedback},
  author        = {Yu, Tianyu and Yao, Yuan and Zhang, Haoye and He, Taiwen and Han, Yifeng and Cui, Ganqu and Hu, Jinyi and Liu, Zhiyuan and Zheng, Hai-Tao and Sun, Maosong and others},
  year          = {2023},
  eprint        = {2312.00849},
  archivePrefix = {arXiv},
  url           = {https://arxiv.org/abs/2312.00849},
}
% RLAIF-V preprint. The arXiv identifier lives in eprint/archivePrefix/url
% instead of a journal field; acronyms in the title are brace-protected and
% author names use the unambiguous "Last, First" form.
@misc{yu2024rlaifv,
  title         = {{RLAIF-V}: Open-Source {AI} Feedback Leads to Super {GPT-4V} Trustworthiness},
  author        = {Yu, Tianyu and Zhang, Haoye and Li, Qiming and Xu, Qixin and Yao, Yuan and Chen, Da and Lu, Xiaoman and Cui, Ganqu and Dang, Yunkai and He, Taiwen and Feng, Xiaocheng and Song, Jun and Zheng, Bo and Liu, Zhiyuan and Chua, Tat-Seng and Sun, Maosong},
  year          = {2024},
  eprint        = {2405.17220},
  archivePrefix = {arXiv},
  url           = {https://arxiv.org/abs/2405.17220},
}
% MiniCPM-V 4.5 preprint. The model name and acronym in the title are
% brace-protected against style recasing; author names use the unambiguous
% "Last, First" form.
@misc{yu2025minicpmv45cookingefficient,
  title         = {{MiniCPM-V} 4.5: Cooking Efficient {MLLMs} via Architecture, Data, and Training Recipe},
  author        = {Yu, Tianyu and Wang, Zefan and Wang, Chongyi and Huang, Fuwei and Ma, Wenshuo and He, Zhihui and Cai, Tianchi and Chen, Weize and Huang, Yuxiang and Zhao, Yuanqian and Xu, Bokai and Cui, Junbo and Xu, Yingjing and Ruan, Liqing and Zhang, Luoyuan and Liu, Hanyu and Tang, Jingkun and Liu, Hongyuan and Guo, Qining and Hu, Wenhao and He, Bingxiang and Zhou, Jie and Cai, Jie and Qi, Ji and Guo, Zonghao and Chen, Chi and Zeng, Guoyang and Li, Yuxuan and Cui, Ganqu and Ding, Ning and Han, Xu and Yao, Yuan and Liu, Zhiyuan and Sun, Maosong},
  year          = {2025},
  eprint        = {2509.18154},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
  url           = {https://arxiv.org/abs/2509.18154},
}

RLAIF-V-Dataset.torrent

Seeding: 1 · Downloading: 0 · Completed: 215 · Total Downloads: 307

RLAIF-V-Dataset/
- README.md
  1.86 KB
- README.txt
  3.72 KB

This dataset is contributed by community users and is intended for educational and informational purposes only. If any content involves copyright infringement, please contact us at [email protected] for prompt review and removal.

Related Datasets

FigureBench Scientific Illustration Generation Benchmark Dataset

Command Palette

RLAIF-V-Dataset Large-scale Multimodal Preference Dataset

Citation

Build AI with AI

HyperAI Newsletters

Command Palette

RLAIF-V-Dataset Large-scale Multimodal Preference Dataset

Citation

Related Datasets

MAKIEVAL Multilingual Cultural Knowledge Assessment Dataset

Verbatim Spans Query Condition Evidence Extraction Dataset

SAM 3D Artist Objects 3D Object Reconstruction Dataset

FigureBench Scientific Illustration Generation Benchmark Dataset

TACK Targeted Chimera Knowledge Base Dataset

EAVSD E-commerce Advertising Video Storyboard Dataset

DeepCrack Infrastructure Crack Detection Dataset

SMOL Multilingual Translation Parallel Dataset

chi-bench Medical Intelligent Agent Benchmark Evaluation Dataset

ViMU Video Metaphor Understanding Dataset

MemLens Multimodal Long Context Benchmark Dataset

AgentTrove Intelligent Agent Interaction Trajectory Dataset

MathNet Multimodal Mathematical Benchmark Inference Dataset

Claw-Eval Real-World Benchmark Dataset

Long-Distance Wildfire & Smoke Detection Dataset

QCalEval Quantum Calibration Graph Understanding Dataset

RSRCC Remote Sensing Area Change Understanding Benchmark Dataset

BRIGHT Disaster Building Assessment Dataset

OmniParsingBench Multimodal Parsing Capability Evaluation Dataset

MDPBench Multilingual Document Parsing Benchmark Dataset

Build AI with AI

HyperAI Newsletters

Command Palette

RLAIF-V-Dataset Large-scale Multimodal Preference Dataset

Citation

Related Datasets

MAKIEVAL Multilingual Cultural Knowledge Assessment Dataset

Verbatim Spans Query Condition Evidence Extraction Dataset

SAM 3D Artist Objects 3D Object Reconstruction Dataset

FigureBench Scientific Illustration Generation Benchmark Dataset

TACK Targeted Chimera Knowledge Base Dataset

EAVSD E-commerce Advertising Video Storyboard Dataset

DeepCrack Infrastructure Crack Detection Dataset

SMOL Multilingual Translation Parallel Dataset

chi-bench Medical Intelligent Agent Benchmark Evaluation Dataset

ViMU Video Metaphor Understanding Dataset

MemLens Multimodal Long Context Benchmark Dataset

AgentTrove Intelligent Agent Interaction Trajectory Dataset

MathNet Multimodal Mathematical Benchmark Inference Dataset

Claw-Eval Real-World Benchmark Dataset

Long-Distance Wildfire & Smoke Detection Dataset

QCalEval Quantum Calibration Graph Understanding Dataset

RSRCC Remote Sensing Area Change Understanding Benchmark Dataset

BRIGHT Disaster Building Assessment Dataset

OmniParsingBench Multimodal Parsing Capability Evaluation Dataset

MDPBench Multilingual Document Parsing Benchmark Dataset

Build AI with AI

HyperAI Newsletters

Related Datasets

MAKIEVAL Multilingual Cultural Knowledge Assessment Dataset

Verbatim Spans Query Condition Evidence Extraction Dataset

SAM 3D Artist Objects 3D Object Reconstruction Dataset

FigureBench Scientific Illustration Generation Benchmark Dataset

TACK Targeted Chimera Knowledge Base Dataset

EAVSD E-commerce Advertising Video Storyboard Dataset

DeepCrack Infrastructure Crack Detection Dataset

SMOL Multilingual Translation Parallel Dataset

chi-bench Medical Intelligent Agent Benchmark Evaluation Dataset

ViMU Video Metaphor Understanding Dataset

MemLens Multimodal Long Context Benchmark Dataset

AgentTrove Intelligent Agent Interaction Trajectory Dataset

MathNet Multimodal Mathematical Benchmark Inference Dataset

Claw-Eval Real-World Benchmark Dataset

Long-Distance Wildfire & Smoke Detection Dataset

QCalEval Quantum Calibration Graph Understanding Dataset

RSRCC Remote Sensing Area Change Understanding Benchmark Dataset

BRIGHT Disaster Building Assessment Dataset

OmniParsingBench Multimodal Parsing Capability Evaluation Dataset

MDPBench Multilingual Document Parsing Benchmark Dataset

Related Datasets

MAKIEVAL Multilingual Cultural Knowledge Assessment Dataset