File size: 393 Bytes
460d762
b2c063a
 
85dbbc4
fe6d73e
 
460d762
0227006
 
 
99b25b8
 
 
58b9de9
 
dcf13df
8135339
 
99b25b8
 
150bb15
6632750
150bb15
5c4aa1e
8135339
5c4aa1e
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
# Local environment, caches, notebooks, and editor settings.
venv/
__pycache__/
.env
.ipynb_checkpoints
# NOTE(review): there is no dot before "ipynb", so this pattern ignores any
# name ending in "ipynb" (which includes every .ipynb notebook). If only
# notebooks are meant, "*.ipynb" would be the tighter form - confirm.
*ipynb
.vscode/

# Evaluation directories. The "-bk" entries are presumably backups and the
# "hhem21" entries presumably belong to one specific evaluator version -
# confirm against the scripts that create them.
gpt_4_evals/
human_evals/
eval-queue/
eval-results/
auto_evals/
eval-queue-bk/
eval-results-bk/
eval-results-bk_hhem21/
eval-results_hhem21/
hhem21_server/

# Single HTML file under src/assets (presumably generated - confirm).
src/assets/model_counts.html

# Result folders and stand-alone scripts kept out of version control.
# A trailing "/" restricts a pattern to directories; entries without one
# match a file or a directory of that name at any depth.
generation_results/
Hallucination Leaderboard Results
dataset_stats.py
hhem_v21_eval.py

# Comparison script and a CSV whose name suggests it is that script's output
# (TODO confirm).
get_comparison.py
GPT-4-Turbo_v.s._GPT-4o.csv