update literature

2d8ef71c · Tania Bladier · d2a51f8e · 2d8ef71c · 2d8ef71c · 2d8ef71c
Commit 2d8ef71c authored 6 months ago by Tania Bladier
--- a/2006.03189v1.pdf
+++ b/2006.03189v1.pdf
--- a/2303.16634v3.pdf
+++ b/2303.16634v3.pdf
--- a/2404.08008v1.pdf
+++ b/2404.08008v1.pdf
--- a/2405.18638v2.pdf
+++ b/2405.18638v2.pdf
--- a/2406.09056v3.pdf
+++ b/2406.09056v3.pdf
--- a/2409.16191v1.pdf
+++ b/2409.16191v1.pdf
--- a/amu-literature.bib
+++ b/amu-literature.bib
@@ -1167,6 +1167,73 @@
  groups  = {Groupe de lecture},
 }

+@Article{que2024hellobench,
+  author  = {Que, Haoran and Duan, Feiyu and He, Liqun and Mou, Yutao and Zhou, Wangchunshu and Liu, Jiaheng and Rong, Wenge and Wang, Zekun Moore and Yang, Jian and Zhang, Ge and others},
+  journal = {arXiv preprint arXiv:2409.16191},
+  title   = {{HelloBench}: Evaluating Long Text Generation Capabilities of Large Language Models},
+  year    = {2024},
+  file    = {:2409.16191v1.pdf:PDF},
+  groups  = {evaluation},
+}
+
+@Article{feng2024sample,
+  author  = {Feng, Kehua and Ding, Keyan and Ma, Kede and Wang, Zhihua and Zhang, Qiang and Chen, Huajun},
+  title   = {Sample-Efficient Human Evaluation of Large Language Models via Maximum Discrepancy Competition},
+  year    = {2024},
+  journal = {arXiv preprint arXiv:2404.08008},
+  groups  = {evaluation},
+  file    = {:2404.08008v1.pdf:PDF},
+}
+
+@Article{tam2024framework,
+  author    = {Tam, Thomas Yu Chow and Sivarajkumar, Sonish and Kapoor, Sumit and Stolyar, Alisa V and Polanska, Katelyn and McCarthy, Karleigh R and Osterhoudt, Hunter and Wu, Xizhi and Visweswaran, Shyam and Fu, Sunyang and others},
+  journal   = {npj Digital Medicine},
+  title     = {A framework for human evaluation of large language models in healthcare derived from literature review},
+  year      = {2024},
+  number    = {1},
+  pages     = {258},
+  volume    = {7},
+  file      = {:s41746-024-01258-7.pdf:PDF},
+  groups    = {evaluation},
+  publisher = {Nature Publishing Group UK},
+}
+
+@Article{elangovan2024considers,
+  author  = {Elangovan, Aparna and Liu, Ling and Xu, Lei and Bodapati, Sravan and Roth, Dan},
+  journal = {arXiv preprint arXiv:2405.18638},
+  title   = {{ConSiDERS-The-Human} Evaluation Framework: Rethinking Human Evaluation for Generative Large Language Models},
+  year    = {2024},
+  file    = {:2405.18638v2.pdf:PDF},
+  groups  = {evaluation},
+}
+
+@Article{tao2024cudrt,
+  author  = {Tao, Zhen and Li, Zhiyu and Xi, Dinghao and Xu, Wei},
+  journal = {arXiv preprint arXiv:2406.09056},
+  title   = {{CUDRT}: Benchmarking the Detection of Human vs. Large Language Models Generated Texts},
+  year    = {2024},
+  file    = {:2406.09056v3.pdf:PDF},
+  groups  = {evaluation},
+}
+
+@Article{ccano2020human,
+  author  = {{\c{C}}ano, Erion and Bojar, Ond{\v{r}}ej},
+  journal = {arXiv preprint arXiv:2006.03189},
+  title   = {Human or Machine: Automating Human Likeliness Evaluation of {NLG} Texts},
+  year    = {2020},
+  file    = {:2006.03189v1.pdf:PDF},
+  groups  = {evaluation},
+}
+
+@Article{liu2023g,
+  author  = {Liu, Yang and Iter, Dan and Xu, Yichong and Wang, Shuohang and Xu, Ruochen and Zhu, Chenguang},
+  journal = {arXiv preprint arXiv:2303.16634},
+  title   = {{G-Eval}: {NLG} Evaluation Using {GPT-4} with Better Human Alignment},
+  year    = {2023},
+  file    = {:2303.16634v3.pdf:PDF},
+  groups  = {evaluation},
+}
+
 @Comment{jabref-meta: databaseType:bibtex;}

 @Comment{jabref-meta: grouping:
@@ -1177,10 +1244,10 @@
 2 StaticGroup:incremental-ml\;0\;1\;0x996699ff\;\;\;;
 1 StaticGroup:data\;0\;1\;0xcc3333ff\;\;\;;
 1 StaticGroup:evaluation\;0\;1\;0xffff4dff\;\;\;;
+2 StaticGroup:comparison-literary-texts\;0\;1\;0xcc6633ff\;\;\;;
 1 StaticGroup:read-asap\;0\;1\;0x488accff\;\;\;;
 2 StaticGroup:alexis' papers\;0\;1\;0x4d8080ff\;\;\;;
 1 StaticGroup:misc\;0\;0\;0xb3e6b3ff\;\;\;;
 1 StaticGroup:Groupe de lecture\;0\;1\;0x00ffffff\;\;\;;
 1 StaticGroup:Tokenization\;0\;1\;0xd74ecbff\;\;\;;
-1 StaticGroup:comparison-literary-texts\;0\;1\;0xcc6633ff\;\;\;;
 }
--- a/s41746-024-01258-7.pdf
+++ b/s41746-024-01258-7.pdf