---
# Manifest for the "code-debug-env" environment: an agent is handed buggy
# Python code plus test descriptions, submits fixes, and is scored by the
# fraction of tests that pass.
#
# NOTE(review): this file was rebuilt from a flattened copy that had lost its
# indentation. The nesting under `tasks`, `reward` and `constraints` is
# inferred from key order (a second top-level `type` would be a duplicate
# key) — confirm against the consumer's schema.

name: code-debug-env
# Quoted so the version stays a string rather than being retyped by a parser.
version: "1.0.0"
description: >-
  An OpenEnv environment where an AI agent debugs broken Python code.
  The agent receives buggy code and test descriptions, submits fixes,
  and is rewarded by the fraction of tests passing (0.0–1.0).
type: space
runtime: fastapi
# "<module path>:<attribute>" reference to the application object; quoted
# because the value contains a colon.
app: "code_debug_env.server.app:app"
port: 7860

# Task catalogue. The step budget grows with difficulty:
# easy = 5, medium = 7, hard = 10.
tasks:
  - id: task_001_off_by_one
    difficulty: easy
    max_steps: 5
  - id: task_002_wrong_operator
    difficulty: easy
    max_steps: 5
  - id: task_003_mutable_default
    difficulty: medium
    max_steps: 7
  - id: task_004_scope_bug
    difficulty: medium
    max_steps: 7
  - id: task_005_binary_search
    difficulty: hard
    max_steps: 10
  - id: task_006_graph_cycle
    difficulty: hard
    max_steps: 10

# Scoring: the share of tests passing, bounded to the closed range below.
reward:
  type: deterministic
  range: [0.0, 1.0]
  formula: "tests_passed / total_tests"

# Resource limits. Values with units are kept as quoted strings.
constraints:
  runtime_limit: "20 minutes"
  vcpu: 2
  memory: "8GB"