Skip to content

Commit 5197f48

Browse files
committed
simplify
1 parent b559bb7 commit 5197f48

File tree

2 files changed

+3
-28
lines changed

2 files changed

+3
-28
lines changed

resources_servers/verifiers/schemas.py

Lines changed: 1 addition & 22 deletions
Original file line number | Diff line number | Diff line change
@@ -22,7 +22,7 @@
2222
BaseVerifyRequest,
2323
BaseVerifyResponse,
2424
)
25-
from nemo_gym.openai_utils import NeMoGymResponse, NeMoGymResponseCreateParamsNonStreaming, NeMoGymResponseOutputItem
25+
from nemo_gym.openai_utils import NeMoGymResponse, NeMoGymResponseCreateParamsNonStreaming
2626

2727

2828
class VerifiersResourcesServerConfig(BaseResourcesServerConfig):
@@ -66,27 +66,6 @@ class VerifiersCloseResponse(BaseModel):
6666
success: bool
6767

6868

69-
class VerifiersAgentConfig(BaseModel):
70-
model_config = ConfigDict(extra="allow")
71-
72-
vf_env_id: str = Field(description="Default verifiers environment ID")
73-
vf_env_args: dict = Field(default_factory=dict, description="Default environment arguments")
74-
dataset_n: int = Field(default=-1, description="Number of examples to load")
75-
dataset_seed: int | None = Field(default=None, description="Seed for dataset shuffling")
76-
group_size: int = Field(default=1, description="Number of rollouts per example")
77-
max_concurrent_generation: int = Field(default=-1, description="Max concurrent generation")
78-
max_concurrent_scoring: int = Field(default=-1, description="Max concurrent scoring")
79-
80-
81-
class VerifiersAgentRunRequest(BaseModel):
82-
model_config = ConfigDict(extra="allow")
83-
84-
task_idx: int = Field(description="Index of the example to run")
85-
responses_create_params: NeMoGymResponseCreateParamsNonStreaming = Field(
86-
default_factory=lambda: NeMoGymResponseCreateParamsNonStreaming(input=[])
87-
)
88-
89-
9069
class VerifiersNeMoGymResponse(NeMoGymResponse):
9170
env_id: str
9271
group_id: str

responses_api_agents/verifiers_agent/app.py

Lines changed: 2 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -12,8 +12,8 @@
1212
# See the License for the specific language governing permissions and
1313
# limitations under the License.
1414
import logging
15-
import sys
1615
import traceback
16+
import uuid
1717
from typing import Any
1818

1919
import aiohttp
@@ -34,7 +34,6 @@
3434
VerifiersAgentVerifyRequest,
3535
VerifiersAgentVerifyResponse,
3636
VerifiersNeMoGymResponse,
37-
VerifiersSeedSessionResponse,
3837
)
3938

4039

@@ -71,7 +70,6 @@ async def create(self, *args: Any, **kwargs: Any) -> ChatCompletion:
7170
choice_dict = response_dict["choices"][0]
7271
message_dict = choice_dict.get("message", {})
7372

74-
7573
prompt_token_ids = message_dict.pop("prompt_token_ids", [])
7674
generation_token_ids = message_dict.pop("generation_token_ids", [])
7775
generation_log_probs = message_dict.pop("generation_log_probs", [])
@@ -164,7 +162,6 @@ async def _ensure_env_loaded(self, vf_env_id: str) -> tuple[vf.Environment, str,
164162
if vf_env_id in _ENVS_CACHE:
165163
return _ENVS_CACHE[vf_env_id], _ENV_IDS_CACHE[vf_env_id], _DATASET_ROWS_CACHE[vf_env_id]
166164

167-
import uuid
168165
env_id = f"{vf_env_id}-{uuid.uuid4().hex[:8]}"
169166
logger.info(f"Loading verifiers environment: {vf_env_id}")
170167

@@ -226,9 +223,8 @@ def _convert_trajectory_to_output(self, state: dict) -> list:
226223
from nemo_gym.openai_utils import (
227224
NeMoGymEasyInputMessage,
228225
NeMoGymResponseOutputMessage,
229-
NeMoGymResponseOutputText,
230-
NeMoGymEasyInputMessageForTraining,
231226
NeMoGymResponseOutputMessageForTraining,
227+
NeMoGymResponseOutputText,
232228
)
233229

234230
output = []

0 commit comments

Comments
 (0)