-
Notifications
You must be signed in to change notification settings - Fork 131
Expand file tree
/
Copy pathswebench_openhands.yaml
More file actions
54 lines (49 loc) · 1.99 KB
/
swebench_openhands.yaml
File metadata and controls
54 lines (49 loc) · 1.99 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
# SWE-bench wrapper configuration for OpenHands
#
# Declares one `swe_agents` server entry (under `responses_api_agents`) that
# runs SWE-bench tasks through the OpenHands agent framework, plus the
# datasets associated with it.
swe_agents:
  responses_api_agents:
    swe_agents:
      entrypoint: app.py
      domain: coding
      description: SWE-bench driven by the OpenHands agent framework.
      value: Eval software engineering capabilities on SWE-bench.

      # Agent framework configuration
      agent_framework: openhands
      agent_config: responses_api_agents/swe_agents/configs/oh_config.toml
      agent_max_turns: 100
      agent_framework_repo: https://github.com/sdevare-nv/nv-OpenHands.git
      # Pinned commit of the repository above. Quoted so the hash always loads
      # as a string, even if a future hash happens to look numeric.
      agent_framework_commit: '6a5d7571d5e9a5ca4586dad62da97a89f8c07084'  # pragma: allowlist secret

      # Container configuration
      # `???` looks like the OmegaConf/Hydra "mandatory value" placeholder, i.e.
      # the value must be supplied at launch time - TODO confirm with the loader.
      container_formatter: ???
      container_folder_path: null
      # NOTE(review): timeout units are not stated in this file (presumably
      # seconds); the memory limit is in MB per its key name.
      swebench_agent_timeout: 1800
      swebench_tests_timeout: 900
      apptainer_memory_limit_mb: 32768
      command_exec_timeout: 300
      dataset_path: ???

      # Optional model server reference
      model_server:
        name: policy_model  # openai_model
        type: responses_api_models

      datasets:
        # Training dataset
        - name: train
          type: train
          jsonl_fpath: responses_api_agents/swe_agents/data/swegym_for_sweagent_and_openhands.jsonl
          gitlab_identifier:
            dataset_name: swegym_for_sweagent_and_openhands
            # Quoted so a future two-part version (e.g. 0.10) is not read as a float.
            version: '0.0.2'
            artifact_fpath: swegym-converted.jsonl
          license: Apache 2.0

        # Validation dataset
        - name: validation
          type: validation
          jsonl_fpath: responses_api_agents/swe_agents/data/swebench_verified_for_sweagent_and_openhands.jsonl
          gitlab_identifier:
            dataset_name: swebench_verified_for_sweagent_and_openhands
            version: '0.0.1'
            artifact_fpath: swebench_verified_for_sweagent_and_openhands.jsonl
          license: TBD

        # Example dataset for quick testing
        - name: example
          type: example
          jsonl_fpath: responses_api_agents/swe_agents/data/example.jsonl