github-actions[bot] committed on
Commit ·
ca3cd0c
1
Parent(s): b60f14f
Update leaderboard from GitHub main branch
Browse files
- app.py +3 -3
- auto_eval.py +6 -4
app.py
CHANGED
|
@@ -297,7 +297,7 @@ with gr.Blocks(css=custom_css, title="LLM Enzyme Kinetics Extraction Benchmark")
|
|
| 297 |
label="Model Provider"
|
| 298 |
)
|
| 299 |
ocr_type_dropdown = gr.Dropdown(
|
| 300 |
-
choices=["All", "mathpix", "kimi", "pymupdf"],
|
| 301 |
value="All",
|
| 302 |
label="OCR Type"
|
| 303 |
)
|
|
@@ -424,7 +424,7 @@ with gr.Blocks(css=custom_css, title="LLM Enzyme Kinetics Extraction Benchmark")
|
|
| 424 |
|
| 425 |
with gr.Row():
|
| 426 |
ocr_type_input = gr.Dropdown(
|
| 427 |
-
choices=["mathpix", "kimi", "pymupdf"],
|
| 428 |
value="mathpix",
|
| 429 |
label="OCR Type *",
|
| 430 |
info="Which OCR version to use for evaluation"
|
|
@@ -579,7 +579,7 @@ with gr.Blocks(css=custom_css, title="LLM Enzyme Kinetics Extraction Benchmark")
|
|
| 579 |
|
| 580 |
with gr.Row():
|
| 581 |
ocr_type_input = gr.Dropdown(
|
| 582 |
-
choices=["mathpix", "kimi", "pymupdf"],
|
| 583 |
label="OCR Type *"
|
| 584 |
)
|
| 585 |
submitter_input = gr.Textbox(label="Submitter Name/Email *", placeholder="Your name or contact")
|
|
|
|
| 297 |
label="Model Provider"
|
| 298 |
)
|
| 299 |
ocr_type_dropdown = gr.Dropdown(
|
| 300 |
+
choices=["All", "mathpix", "kimi", "pymupdf", "glm_ocr"],
|
| 301 |
value="All",
|
| 302 |
label="OCR Type"
|
| 303 |
)
|
|
|
|
| 424 |
|
| 425 |
with gr.Row():
|
| 426 |
ocr_type_input = gr.Dropdown(
|
| 427 |
+
choices=["mathpix", "kimi", "pymupdf", "glm_ocr"],
|
| 428 |
value="mathpix",
|
| 429 |
label="OCR Type *",
|
| 430 |
info="Which OCR version to use for evaluation"
|
|
|
|
| 579 |
|
| 580 |
with gr.Row():
|
| 581 |
ocr_type_input = gr.Dropdown(
|
| 582 |
+
choices=["mathpix", "kimi", "pymupdf", "glm_ocr"],
|
| 583 |
label="OCR Type *"
|
| 584 |
)
|
| 585 |
submitter_input = gr.Textbox(label="Submitter Name/Email *", placeholder="Your name or contact")
|
auto_eval.py
CHANGED
|
@@ -41,7 +41,7 @@ class BenchmarkEvaluator:
|
|
| 41 |
api_base: API base URL
|
| 42 |
model_name: Model name
|
| 43 |
provider: Provider name (OpenAI, Anthropic, etc.)
|
| 44 |
-
ocr_type: OCR type (mathpix, kimi, pymupdf)
|
| 45 |
submitter: Submitter name/email
|
| 46 |
num_papers: Number of papers to evaluate (default: 5 for testing)
|
| 47 |
|
|
@@ -110,19 +110,21 @@ def main():
|
|
| 110 |
|
| 111 |
print(f"Found {len(papers)} papers to evaluate")
|
| 112 |
|
| 113 |
-
# Initialize extractor
|
| 114 |
provider = os.getenv('LLM_PROVIDER', 'openai').lower()
|
| 115 |
if provider == 'openai':
|
| 116 |
extractor = OpenAIExtractor(
|
| 117 |
api_key=os.getenv('OPENAI_API_KEY'),
|
| 118 |
base_url=os.getenv('OPENAI_API_BASE'),
|
| 119 |
-
model=os.getenv('OPENAI_MODEL')
|
|
|
|
| 120 |
)
|
| 121 |
else:
|
| 122 |
extractor = AnthropicExtractor(
|
| 123 |
api_key=os.getenv('ANTHROPIC_API_KEY'),
|
| 124 |
base_url=os.getenv('ANTHROPIC_API_BASE'),
|
| 125 |
-
model=os.getenv('ANTHROPIC_MODEL')
|
|
|
|
| 126 |
)
|
| 127 |
|
| 128 |
# Run extraction
|
|
|
|
| 41 |
api_base: API base URL
|
| 42 |
model_name: Model name
|
| 43 |
provider: Provider name (OpenAI, Anthropic, etc.)
|
| 44 |
+
ocr_type: OCR type (mathpix, kimi, pymupdf, glm_ocr)
|
| 45 |
submitter: Submitter name/email
|
| 46 |
num_papers: Number of papers to evaluate (default: 5 for testing)
|
| 47 |
|
|
|
|
| 110 |
|
| 111 |
print(f"Found {len(papers)} papers to evaluate")
|
| 112 |
|
| 113 |
+
# Initialize extractor with optimizations enabled
|
| 114 |
provider = os.getenv('LLM_PROVIDER', 'openai').lower()
|
| 115 |
if provider == 'openai':
|
| 116 |
extractor = OpenAIExtractor(
|
| 117 |
api_key=os.getenv('OPENAI_API_KEY'),
|
| 118 |
base_url=os.getenv('OPENAI_API_BASE'),
|
| 119 |
+
model=os.getenv('OPENAI_MODEL'),
|
| 120 |
+
use_stream=True # Enable streaming for faster response
|
| 121 |
)
|
| 122 |
else:
|
| 123 |
extractor = AnthropicExtractor(
|
| 124 |
api_key=os.getenv('ANTHROPIC_API_KEY'),
|
| 125 |
base_url=os.getenv('ANTHROPIC_API_BASE'),
|
| 126 |
+
model=os.getenv('ANTHROPIC_MODEL'),
|
| 127 |
+
use_stream=True # Enable streaming for faster response
|
| 128 |
)
|
| 129 |
|
| 130 |
# Run extraction
|