Skip to content
Snippets Groups Projects
Commit 2d8ef71c authored by Tania Bladier's avatar Tania Bladier
Browse files

update literature

parent d2a51f8e
No related branches found
No related tags found
No related merge requests found
File added
File added
File added
File added
File added
File added
......@@ -1167,6 +1167,73 @@
groups = {Groupe de lecture},
}
% HelloBench (arXiv preprint). The journal field is kept so styles that ignore
% eprint still print the identifier; eprint/archiveprefix carry it in
% machine-readable form. Braces protect the benchmark name from style recasing.
@Article{que2024hellobench,
  author        = {Que, Haoran and Duan, Feiyu and He, Liqun and Mou, Yutao and Zhou, Wangchunshu and Liu, Jiaheng and Rong, Wenge and Wang, Zekun Moore and Yang, Jian and Zhang, Ge and others},
  journal       = {arXiv preprint arXiv:2409.16191},
  title         = {{HelloBench}: Evaluating Long Text Generation Capabilities of Large Language Models},
  year          = {2024},
  archiveprefix = {arXiv},
  eprint        = {2409.16191},
  file          = {:2409.16191v1.pdf:PDF},
  groups        = {evaluation},
}
% arXiv preprint. The journal field is kept so styles that ignore eprint still
% print the identifier; eprint/archiveprefix carry it in machine-readable form.
@Article{feng2024sample,
  author        = {Feng, Kehua and Ding, Keyan and Ma, Kede and Wang, Zhihua and Zhang, Qiang and Chen, Huajun},
  journal       = {arXiv preprint arXiv:2404.08008},
  title         = {Sample-Efficient Human Evaluation of Large Language Models via Maximum Discrepancy Competition},
  year          = {2024},
  archiveprefix = {arXiv},
  eprint        = {2404.08008},
  file          = {:2404.08008v1.pdf:PDF},
  groups        = {evaluation},
}
% Journal article; pages holds the article number (the venue has no page ranges).
% Publisher name and city are stored in separate fields.
% NOTE(review): doi is derived from the attached file name - confirm it resolves.
@Article{tam2024framework,
  author    = {Tam, Thomas Yu Chow and Sivarajkumar, Sonish and Kapoor, Sumit and Stolyar, Alisa V. and Polanska, Katelyn and McCarthy, Karleigh R. and Osterhoudt, Hunter and Wu, Xizhi and Visweswaran, Shyam and Fu, Sunyang and others},
  journal   = {{npj} Digital Medicine},
  title     = {A framework for human evaluation of large language models in healthcare derived from literature review},
  year      = {2024},
  number    = {1},
  pages     = {258},
  volume    = {7},
  doi       = {10.1038/s41746-024-01258-7},
  file      = {:s41746-024-01258-7.pdf:PDF},
  groups    = {evaluation},
  publisher = {Nature Publishing Group UK},
  address   = {London},
}
% arXiv preprint. The journal field is kept so styles that ignore eprint still
% print the identifier; eprint/archiveprefix carry it in machine-readable form.
% Braces keep the mixed-case framework name intact under sentence-casing styles.
@Article{elangovan2024considers,
  author        = {Elangovan, Aparna and Liu, Ling and Xu, Lei and Bodapati, Sravan and Roth, Dan},
  journal       = {arXiv preprint arXiv:2405.18638},
  title         = {{ConSiDERS-The-Human} Evaluation Framework: Rethinking Human Evaluation for Generative Large Language Models},
  year          = {2024},
  archiveprefix = {arXiv},
  eprint        = {2405.18638},
  file          = {:2405.18638v2.pdf:PDF},
  groups        = {evaluation},
}
% arXiv preprint. The journal field is kept so styles that ignore eprint still
% print the identifier; eprint/archiveprefix carry it in machine-readable form.
% Braces keep the benchmark acronym upper-case under sentence-casing styles.
@Article{tao2024cudrt,
  author        = {Tao, Zhen and Li, Zhiyu and Xi, Dinghao and Xu, Wei},
  journal       = {arXiv preprint arXiv:2406.09056},
  title         = {{CUDRT}: Benchmarking the Detection of Human vs. Large Language Models Generated Texts},
  year          = {2024},
  archiveprefix = {arXiv},
  eprint        = {2406.09056},
  file          = {:2406.09056v3.pdf:PDF},
  groups        = {evaluation},
}
% arXiv preprint. The journal field is kept so styles that ignore eprint still
% print the identifier; eprint/archiveprefix carry it in machine-readable form.
% Braces keep the acronym NLG upper-case under sentence-casing styles.
@Article{ccano2020human,
  author        = {{\c{C}}ano, Erion and Bojar, Ond{\v{r}}ej},
  journal       = {arXiv preprint arXiv:2006.03189},
  title         = {Human or Machine: Automating Human Likeliness Evaluation of {NLG} Texts},
  year          = {2020},
  archiveprefix = {arXiv},
  eprint        = {2006.03189},
  file          = {:2006.03189v1.pdf:PDF},
  groups        = {evaluation},
}
% arXiv preprint. The journal field is kept so styles that ignore eprint still
% print the identifier; eprint/archiveprefix carry it in machine-readable form.
% Braces protect the method name, the acronym and the model name from recasing.
@Article{liu2023g,
  author        = {Liu, Yang and Iter, Dan and Xu, Yichong and Wang, Shuohang and Xu, Ruochen and Zhu, Chenguang},
  journal       = {arXiv preprint arXiv:2303.16634},
  title         = {{G-Eval}: {NLG} Evaluation using {GPT-4} with Better Human Alignment},
  year          = {2023},
  archiveprefix = {arXiv},
  eprint        = {2303.16634},
  file          = {:2303.16634v3.pdf:PDF},
  groups        = {evaluation},
}
@Comment{jabref-meta: databaseType:bibtex;}
@Comment{jabref-meta: grouping:
......@@ -1177,10 +1244,10 @@
2 StaticGroup:incremental-ml\;0\;1\;0x996699ff\;\;\;;
1 StaticGroup:data\;0\;1\;0xcc3333ff\;\;\;;
1 StaticGroup:evaluation\;0\;1\;0xffff4dff\;\;\;;
2 StaticGroup:comparison-literary-texts\;0\;1\;0xcc6633ff\;\;\;;
1 StaticGroup:read-asap\;0\;1\;0x488accff\;\;\;;
2 StaticGroup:alexis' papers\;0\;1\;0x4d8080ff\;\;\;;
1 StaticGroup:misc\;0\;0\;0xb3e6b3ff\;\;\;;
1 StaticGroup:Groupe de lecture\;0\;1\;0x00ffffff\;\;\;;
1 StaticGroup:Tokenization\;0\;1\;0xd74ecbff\;\;\;;
1 StaticGroup:comparison-literary-texts\;0\;1\;0xcc6633ff\;\;\;;
}
This diff is collapsed.
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Please register or sign in to comment