Spaces:
Running
Running
Commit
·
ccceff6
1
Parent(s):
0b870a2
refactor: Simplify New Evaluation screen for hackathon
Browse files
Remove fields that don't work in containerized HF Jobs/Modal environments:
- Prompt Configuration (YAML) field
- MCP Server URL field
- Additional Imports field
- Working Directory field
These fields require host-level file system access and environment configuration
that aren't available in container-based evaluation jobs. The simplified form now
includes only parameters that work reliably in both HF Jobs and Modal compute.
app.py
CHANGED
|
@@ -2292,25 +2292,6 @@ with gr.Blocks(title="TraceMind-AI", theme=theme) as app:
|
|
| 2292 |
info="Select additional tools to enable for the agent"
|
| 2293 |
)
|
| 2294 |
|
| 2295 |
-
with gr.Row():
|
| 2296 |
-
eval_prompt_yml = gr.Textbox(
|
| 2297 |
-
label="Prompt Configuration (YAML)",
|
| 2298 |
-
info="Path to prompt configuration file (optional)",
|
| 2299 |
-
placeholder="path/to/prompt.yml"
|
| 2300 |
-
)
|
| 2301 |
-
|
| 2302 |
-
eval_mcp_server_url = gr.Textbox(
|
| 2303 |
-
label="MCP Server URL",
|
| 2304 |
-
info="Model Context Protocol server URL (optional)",
|
| 2305 |
-
placeholder="http://localhost:8080"
|
| 2306 |
-
)
|
| 2307 |
-
|
| 2308 |
-
eval_additional_imports = gr.Textbox(
|
| 2309 |
-
label="Additional Imports",
|
| 2310 |
-
info="Comma-separated list of Python modules for CodeAgent (optional)",
|
| 2311 |
-
placeholder="numpy,pandas,requests"
|
| 2312 |
-
)
|
| 2313 |
-
|
| 2314 |
# Section 4: Test Configuration
|
| 2315 |
with gr.Accordion("🧪 Test Configuration", open=True):
|
| 2316 |
gr.Markdown("*Configure test dataset and execution parameters*")
|
|
@@ -2344,12 +2325,6 @@ with gr.Blocks(title="TraceMind-AI", theme=theme) as app:
|
|
| 2344 |
maximum=10
|
| 2345 |
)
|
| 2346 |
|
| 2347 |
-
eval_working_directory = gr.Textbox(
|
| 2348 |
-
label="Working Directory",
|
| 2349 |
-
info="Working directory for file tools (optional)",
|
| 2350 |
-
placeholder="/tmp/agent_workspace"
|
| 2351 |
-
)
|
| 2352 |
-
|
| 2353 |
# Section 5: Output & Monitoring Configuration
|
| 2354 |
with gr.Accordion("📊 Output & Monitoring", open=True):
|
| 2355 |
gr.Markdown("*Configure output format and monitoring options*")
|
|
@@ -2538,9 +2513,9 @@ with gr.Blocks(title="TraceMind-AI", theme=theme) as app:
|
|
| 2538 |
# Model Configuration
|
| 2539 |
model, provider, hf_inference_provider, hf_token,
|
| 2540 |
# Agent Configuration
|
| 2541 |
-
agent_type, search_provider, enable_tools,
|
| 2542 |
# Test Configuration
|
| 2543 |
-
dataset_name, split, difficulty, parallel_workers,
|
| 2544 |
# Output & Monitoring
|
| 2545 |
output_format, output_dir, enable_otel, enable_gpu_metrics, private, debug, quiet, run_id
|
| 2546 |
):
|
|
@@ -2569,12 +2544,6 @@ with gr.Blocks(title="TraceMind-AI", theme=theme) as app:
|
|
| 2569 |
cli_command_parts.append("--hf-token $HF_TOKEN")
|
| 2570 |
|
| 2571 |
cli_command_parts.append(f"--agent-type {agent_type}")
|
| 2572 |
-
if prompt_yml:
|
| 2573 |
-
cli_command_parts.append(f"--prompt-yml {prompt_yml}")
|
| 2574 |
-
if mcp_server_url:
|
| 2575 |
-
cli_command_parts.append(f"--mcp-server-url {mcp_server_url}")
|
| 2576 |
-
if additional_imports:
|
| 2577 |
-
cli_command_parts.append(f"--additional-imports {additional_imports}")
|
| 2578 |
|
| 2579 |
cli_command_parts.append(f"--dataset-name {dataset_name}")
|
| 2580 |
cli_command_parts.append(f"--split {split}")
|
|
@@ -2582,8 +2551,6 @@ with gr.Blocks(title="TraceMind-AI", theme=theme) as app:
|
|
| 2582 |
cli_command_parts.append(f"--difficulty {difficulty}")
|
| 2583 |
if parallel_workers > 1:
|
| 2584 |
cli_command_parts.append(f"--parallel-workers {parallel_workers}")
|
| 2585 |
-
if working_directory:
|
| 2586 |
-
cli_command_parts.append(f"--working-directory {working_directory}")
|
| 2587 |
|
| 2588 |
cli_command_parts.append(f"--output-format {output_format}")
|
| 2589 |
if output_dir and output_format == "json":
|
|
@@ -3259,9 +3226,9 @@ Result: {result}
|
|
| 3259 |
# Model Configuration
|
| 3260 |
eval_model, eval_provider, eval_hf_inference_provider, eval_hf_token,
|
| 3261 |
# Agent Configuration
|
| 3262 |
-
eval_agent_type, eval_search_provider, eval_enable_tools,
|
| 3263 |
# Test Configuration
|
| 3264 |
-
eval_dataset_name, eval_split, eval_difficulty, eval_parallel_workers,
|
| 3265 |
# Output & Monitoring
|
| 3266 |
eval_output_format, eval_output_dir, eval_enable_otel, eval_enable_gpu_metrics, eval_private, eval_debug, eval_quiet, eval_run_id
|
| 3267 |
],
|
|
|
|
| 2292 |
info="Select additional tools to enable for the agent"
|
| 2293 |
)
|
| 2294 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2295 |
# Section 4: Test Configuration
|
| 2296 |
with gr.Accordion("🧪 Test Configuration", open=True):
|
| 2297 |
gr.Markdown("*Configure test dataset and execution parameters*")
|
|
|
|
| 2325 |
maximum=10
|
| 2326 |
)
|
| 2327 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2328 |
# Section 5: Output & Monitoring Configuration
|
| 2329 |
with gr.Accordion("📊 Output & Monitoring", open=True):
|
| 2330 |
gr.Markdown("*Configure output format and monitoring options*")
|
|
|
|
| 2513 |
# Model Configuration
|
| 2514 |
model, provider, hf_inference_provider, hf_token,
|
| 2515 |
# Agent Configuration
|
| 2516 |
+
agent_type, search_provider, enable_tools,
|
| 2517 |
# Test Configuration
|
| 2518 |
+
dataset_name, split, difficulty, parallel_workers,
|
| 2519 |
# Output & Monitoring
|
| 2520 |
output_format, output_dir, enable_otel, enable_gpu_metrics, private, debug, quiet, run_id
|
| 2521 |
):
|
|
|
|
| 2544 |
cli_command_parts.append("--hf-token $HF_TOKEN")
|
| 2545 |
|
| 2546 |
cli_command_parts.append(f"--agent-type {agent_type}")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2547 |
|
| 2548 |
cli_command_parts.append(f"--dataset-name {dataset_name}")
|
| 2549 |
cli_command_parts.append(f"--split {split}")
|
|
|
|
| 2551 |
cli_command_parts.append(f"--difficulty {difficulty}")
|
| 2552 |
if parallel_workers > 1:
|
| 2553 |
cli_command_parts.append(f"--parallel-workers {parallel_workers}")
|
|
|
|
|
|
|
| 2554 |
|
| 2555 |
cli_command_parts.append(f"--output-format {output_format}")
|
| 2556 |
if output_dir and output_format == "json":
|
|
|
|
| 3226 |
# Model Configuration
|
| 3227 |
eval_model, eval_provider, eval_hf_inference_provider, eval_hf_token,
|
| 3228 |
# Agent Configuration
|
| 3229 |
+
eval_agent_type, eval_search_provider, eval_enable_tools,
|
| 3230 |
# Test Configuration
|
| 3231 |
+
eval_dataset_name, eval_split, eval_difficulty, eval_parallel_workers,
|
| 3232 |
# Output & Monitoring
|
| 3233 |
eval_output_format, eval_output_dir, eval_enable_otel, eval_enable_gpu_metrics, eval_private, eval_debug, eval_quiet, eval_run_id
|
| 3234 |
],
|