kshitijthakkar committed on
Commit
ccceff6
·
1 Parent(s): 0b870a2

refactor: Simplify New Evaluation screen for hackathon

Browse files

Remove fields that don't work in containerized HF Jobs/Modal environments:
- Prompt Configuration (YAML) field
- MCP Server URL field
- Additional Imports field
- Working Directory field

These fields require host-level file system access and environment configuration
that aren't available in container-based evaluation jobs. The simplified form now
only includes parameters that work reliably in both HF Jobs and Modal compute.

Files changed (1) hide show
  1. app.py +4 -37
app.py CHANGED
@@ -2292,25 +2292,6 @@ with gr.Blocks(title="TraceMind-AI", theme=theme) as app:
2292
  info="Select additional tools to enable for the agent"
2293
  )
2294
 
2295
- with gr.Row():
2296
- eval_prompt_yml = gr.Textbox(
2297
- label="Prompt Configuration (YAML)",
2298
- info="Path to prompt configuration file (optional)",
2299
- placeholder="path/to/prompt.yml"
2300
- )
2301
-
2302
- eval_mcp_server_url = gr.Textbox(
2303
- label="MCP Server URL",
2304
- info="Model Context Protocol server URL (optional)",
2305
- placeholder="http://localhost:8080"
2306
- )
2307
-
2308
- eval_additional_imports = gr.Textbox(
2309
- label="Additional Imports",
2310
- info="Comma-separated list of Python modules for CodeAgent (optional)",
2311
- placeholder="numpy,pandas,requests"
2312
- )
2313
-
2314
  # Section 4: Test Configuration
2315
  with gr.Accordion("🧪 Test Configuration", open=True):
2316
  gr.Markdown("*Configure test dataset and execution parameters*")
@@ -2344,12 +2325,6 @@ with gr.Blocks(title="TraceMind-AI", theme=theme) as app:
2344
  maximum=10
2345
  )
2346
 
2347
- eval_working_directory = gr.Textbox(
2348
- label="Working Directory",
2349
- info="Working directory for file tools (optional)",
2350
- placeholder="/tmp/agent_workspace"
2351
- )
2352
-
2353
  # Section 5: Output & Monitoring Configuration
2354
  with gr.Accordion("📊 Output & Monitoring", open=True):
2355
  gr.Markdown("*Configure output format and monitoring options*")
@@ -2538,9 +2513,9 @@ with gr.Blocks(title="TraceMind-AI", theme=theme) as app:
2538
  # Model Configuration
2539
  model, provider, hf_inference_provider, hf_token,
2540
  # Agent Configuration
2541
- agent_type, search_provider, enable_tools, prompt_yml, mcp_server_url, additional_imports,
2542
  # Test Configuration
2543
- dataset_name, split, difficulty, parallel_workers, working_directory,
2544
  # Output & Monitoring
2545
  output_format, output_dir, enable_otel, enable_gpu_metrics, private, debug, quiet, run_id
2546
  ):
@@ -2569,12 +2544,6 @@ with gr.Blocks(title="TraceMind-AI", theme=theme) as app:
2569
  cli_command_parts.append("--hf-token $HF_TOKEN")
2570
 
2571
  cli_command_parts.append(f"--agent-type {agent_type}")
2572
- if prompt_yml:
2573
- cli_command_parts.append(f"--prompt-yml {prompt_yml}")
2574
- if mcp_server_url:
2575
- cli_command_parts.append(f"--mcp-server-url {mcp_server_url}")
2576
- if additional_imports:
2577
- cli_command_parts.append(f"--additional-imports {additional_imports}")
2578
 
2579
  cli_command_parts.append(f"--dataset-name {dataset_name}")
2580
  cli_command_parts.append(f"--split {split}")
@@ -2582,8 +2551,6 @@ with gr.Blocks(title="TraceMind-AI", theme=theme) as app:
2582
  cli_command_parts.append(f"--difficulty {difficulty}")
2583
  if parallel_workers > 1:
2584
  cli_command_parts.append(f"--parallel-workers {parallel_workers}")
2585
- if working_directory:
2586
- cli_command_parts.append(f"--working-directory {working_directory}")
2587
 
2588
  cli_command_parts.append(f"--output-format {output_format}")
2589
  if output_dir and output_format == "json":
@@ -3259,9 +3226,9 @@ Result: {result}
3259
  # Model Configuration
3260
  eval_model, eval_provider, eval_hf_inference_provider, eval_hf_token,
3261
  # Agent Configuration
3262
- eval_agent_type, eval_search_provider, eval_enable_tools, eval_prompt_yml, eval_mcp_server_url, eval_additional_imports,
3263
  # Test Configuration
3264
- eval_dataset_name, eval_split, eval_difficulty, eval_parallel_workers, eval_working_directory,
3265
  # Output & Monitoring
3266
  eval_output_format, eval_output_dir, eval_enable_otel, eval_enable_gpu_metrics, eval_private, eval_debug, eval_quiet, eval_run_id
3267
  ],
 
2292
  info="Select additional tools to enable for the agent"
2293
  )
2294
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2295
  # Section 4: Test Configuration
2296
  with gr.Accordion("🧪 Test Configuration", open=True):
2297
  gr.Markdown("*Configure test dataset and execution parameters*")
 
2325
  maximum=10
2326
  )
2327
 
 
 
 
 
 
 
2328
  # Section 5: Output & Monitoring Configuration
2329
  with gr.Accordion("📊 Output & Monitoring", open=True):
2330
  gr.Markdown("*Configure output format and monitoring options*")
 
2513
  # Model Configuration
2514
  model, provider, hf_inference_provider, hf_token,
2515
  # Agent Configuration
2516
+ agent_type, search_provider, enable_tools,
2517
  # Test Configuration
2518
+ dataset_name, split, difficulty, parallel_workers,
2519
  # Output & Monitoring
2520
  output_format, output_dir, enable_otel, enable_gpu_metrics, private, debug, quiet, run_id
2521
  ):
 
2544
  cli_command_parts.append("--hf-token $HF_TOKEN")
2545
 
2546
  cli_command_parts.append(f"--agent-type {agent_type}")
 
 
 
 
 
 
2547
 
2548
  cli_command_parts.append(f"--dataset-name {dataset_name}")
2549
  cli_command_parts.append(f"--split {split}")
 
2551
  cli_command_parts.append(f"--difficulty {difficulty}")
2552
  if parallel_workers > 1:
2553
  cli_command_parts.append(f"--parallel-workers {parallel_workers}")
 
 
2554
 
2555
  cli_command_parts.append(f"--output-format {output_format}")
2556
  if output_dir and output_format == "json":
 
3226
  # Model Configuration
3227
  eval_model, eval_provider, eval_hf_inference_provider, eval_hf_token,
3228
  # Agent Configuration
3229
+ eval_agent_type, eval_search_provider, eval_enable_tools,
3230
  # Test Configuration
3231
+ eval_dataset_name, eval_split, eval_difficulty, eval_parallel_workers,
3232
  # Output & Monitoring
3233
  eval_output_format, eval_output_dir, eval_enable_otel, eval_enable_gpu_metrics, eval_private, eval_debug, eval_quiet, eval_run_id
3234
  ],