-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathenhanced_extraction_performance.json
More file actions
74 lines (74 loc) · 1.64 KB
/
enhanced_extraction_performance.json
File metadata and controls
74 lines (74 loc) · 1.64 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
{
"evaluation_summary": {
"sample_size": 200,
"success_rate_percent": 100.0,
"avg_ingredients_per_file": 11.6,
"avg_instruction_length": 587.1161616161617,
"files_with_instructions_percent": 99.0
},
"quality_distribution": {
"medium": 57,
"high": 89,
"very_low": 25,
"low": 29
},
"source_performance": {
"ccap": {
"files": 9,
"ingredients": 48,
"avg_ingredients": 5.333333333333333
},
"dsmz": {
"files": 191,
"ingredients": 2272,
"avg_ingredients": 11.895287958115183
}
},
"extraction_methods": {
"list": 1171,
"tabular": 1128,
"inline": 21
},
"sample_results": [
{
"file": "ccap_MDY_V.md",
"medium_name": "Ccap Mdy V",
"source": "ccap",
"ingredients": 7,
"has_instructions": true,
"instruction_length": 730
},
{
"file": "dsmz_1313.md",
"medium_name": "Solution A:",
"source": "dsmz",
"ingredients": 22,
"has_instructions": true,
"instruction_length": 258
},
{
"file": "dsmz_343.md",
"medium_name": "343: THERMOTOGA NEAPOLITANA MEDIUM",
"source": "dsmz",
"ingredients": 33,
"has_instructions": true,
"instruction_length": 702
},
{
"file": "dsmz_1227.md",
"medium_name": "Dsmz 1227",
"source": "dsmz",
"ingredients": 19,
"has_instructions": true,
"instruction_length": 400
},
{
"file": "dsmz_1304.md",
"medium_name": "1304: SULFURITALEA MEDIUM",
"source": "dsmz",
"ingredients": 9,
"has_instructions": true,
"instruction_length": 1744
}
]
}