Add ParseBench evaluation results

#26
Files changed (1) hide show
  1. .eval_results/parsebench.yaml +60 -0
.eval_results/parsebench.yaml ADDED
@@ -0,0 +1,60 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ - dataset:
2
+ id: llamaindex/ParseBench
3
+ task_id: mean
4
+ value: 44.1
5
+ date: '2026-04-16'
6
+ source:
7
+ url: https://huggingface.co/datasets/llamaindex/ParseBench
8
+ name: ParseBench
9
+ user: boyang-runllama
10
+ notes: "Pipeline name: qwen3_6_35b_a3b_fp8_vllm_parse_layout"
11
+ - dataset:
12
+ id: llamaindex/ParseBench
13
+ task_id: text_content
14
+ value: 90.7
15
+ date: '2026-04-16'
16
+ source:
17
+ url: https://huggingface.co/datasets/llamaindex/ParseBench
18
+ name: ParseBench
19
+ user: boyang-runllama
20
+ notes: "Pipeline name: qwen3_6_35b_a3b_fp8_vllm_parse_layout"
21
+ - dataset:
22
+ id: llamaindex/ParseBench
23
+ task_id: text_formatting
24
+ value: 58.3
25
+ date: '2026-04-16'
26
+ source:
27
+ url: https://huggingface.co/datasets/llamaindex/ParseBench
28
+ name: ParseBench
29
+ user: boyang-runllama
30
+ notes: "Pipeline name: qwen3_6_35b_a3b_fp8_vllm_parse_layout"
31
+ - dataset:
32
+ id: llamaindex/ParseBench
33
+ task_id: layout
34
+ value: 47.4
35
+ date: '2026-04-16'
36
+ source:
37
+ url: https://huggingface.co/datasets/llamaindex/ParseBench
38
+ name: ParseBench
39
+ user: boyang-runllama
40
+ notes: "Pipeline name: qwen3_6_35b_a3b_fp8_vllm_parse_layout"
41
+ - dataset:
42
+ id: llamaindex/ParseBench
43
+ task_id: chart
44
+ value: 5.1
45
+ date: '2026-04-16'
46
+ source:
47
+ url: https://huggingface.co/datasets/llamaindex/ParseBench
48
+ name: ParseBench
49
+ user: boyang-runllama
50
+ notes: "Pipeline name: qwen3_6_35b_a3b_fp8_vllm_parse_layout"
51
+ - dataset:
52
+ id: llamaindex/ParseBench
53
+ task_id: table
54
+ value: 19.1
55
+ date: '2026-04-16'
56
+ source:
57
+ url: https://huggingface.co/datasets/llamaindex/ParseBench
58
+ name: ParseBench
59
+ user: boyang-runllama
60
+ notes: "Pipeline name: qwen3_6_35b_a3b_fp8_vllm_parse_layout"