prime-rl/src/prime_rl/configs/shared.py at 4ba36d1ac72b60588e5f2160e751301c0eb1a4ee · PrimeIntellect-ai/prime-rl · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
from pathlib import Path
from typing import Annotated, Literal, TypeAlias

from pydantic import BaseModel, Field, model_validator

from prime_rl.utils.config import BaseConfig


class SlurmConfig(BaseConfig):
    """Configures SLURM scheduling."""

    job_name: Annotated[str, Field(description="The SLURM job name.")] = "prime-rl"

    project_dir: Annotated[
        Path,
        Field(description="Path to the project root. Used to source .env, activate .venv, and run uv sync."),
    ] = Path(".")

    template_path: Annotated[
        Path | None,
        Field(
            description="The path to the SLURM template file. If None, will use the default single-node/multi-node template."
        ),
    ] = None

    partition: Annotated[
        str, Field(description="The SLURM partition to use. Will be passed as #SBATCH --partition.")
    ] = "cluster"

    @model_validator(mode="after")
    def resolve_project_dir(self):
        self.project_dir = self.project_dir.resolve()
        return self


ServerType = Literal["vllm", "openai"]


class BaseModelConfig(BaseConfig):
    """Configures the model."""

    name: Annotated[str, Field(description="Name or path of the HF model to use.")] = "Qwen/Qwen3-0.6B"

    trust_remote_code: Annotated[
        bool,
        Field(
            description="Whether to trust remote code for tokenizer initialization.",
        ),
    ] = False


class ElasticConfig(BaseConfig):
    """Configures elastic inference pool with DNS-based service discovery.

    Works with any DNS hostname that resolves to multiple IP addresses.
    """

    hostname: Annotated[
        str,
        Field(
            description="DNS hostname that resolves to inference server IPs.",
        ),
    ]

    port: Annotated[
        int,
        Field(
            description="Port that inference servers listen on.",
        ),
    ] = 8000

    sync_interval: Annotated[
        float,
        Field(
            description="Interval in seconds between server discovery checks.",
        ),
    ] = 5.0


class ClientConfig(BaseConfig):
    """Configures the OAI client.

    Supports two modes:
    - Static mode (default): Uses fixed base_url list
    - Elastic mode: Uses DNS-based service discovery via hostname

    If elastic config is provided, base_url is ignored and servers are discovered dynamically.
    """

    timeout: Annotated[
        int,
        Field(
            description="Timeout in seconds. By default, it is set to 1200 seconds.",
        ),
    ] = 1200

    base_url: Annotated[
        list[str],
        Field(
            description="Base URLs to use for the OpenAI API. By default, it is set to a single server on localhost at port 8000 which matches the default local vLLM server configuration. If you specify more than one URL, the client will round-robin (chat) completion requests across all servers. Ignored if elastic config is provided.",
        ),
    ] = ["http://localhost:8000/v1"]

    api_key_var: Annotated[
        str,
        Field(
            description="Name of environment variable containing the API key to use for the inference API. Will parse using `os.getenv(client_config.api_key_var)`. Can be set to an arbitrary string if the inference server is not protected by an API key. If multiple URLs are specified, the same API key will be used for all servers.",
        ),
    ] = "VLLM_API_KEY"

    headers: Annotated[
        dict[str, str],
        Field(
            description="Headers to use for the OpenAI API. By default, it is set to an empty dictionary.",
        ),
    ] = {}

    skip_model_check: Annotated[
        bool,
        Field(
            description="Whether to skip checking if the model is available in the inference pool. Useful for external APIs or API Keys that don't support the /models endpoint.",
        ),
    ] = False

    elastic: Annotated[
        ElasticConfig | None,
        Field(
            description="Elastic inference pool configuration for DNS-based service discovery. If provided, base_url is ignored and inference servers are discovered dynamically via DNS.",
        ),
    ] = None

    @property
    def is_elastic(self) -> bool:
        """Check if elastic mode is enabled."""
        return self.elastic is not None


class LogConfig(BaseConfig):
    """Configures the logger."""

    level: Annotated[
        str,
        Field(description="Logging level for the process. Will determine the logging verbosity and format."),
    ] = "info"

    vf_level: Annotated[
        str,
        Field(description="Logging level for the verifiers package. Will determine the logging verbosity and format."),
    ] = "info"

    file: Annotated[
        bool,
        Field(
            description="Whether to log to a file. If True, will log to a file in the output directory.",
        ),
    ] = True

    env_worker_logs: Annotated[
        bool,
        Field(
            description="Whether env workers log to files. If True, workers write to logs/env_workers/{env_name}.log.",
        ),
    ] = False

    log_data: Annotated[
        bool,
        Field(
            description="Whether to log the first data sample to the logger.",
        ),
    ] = False

    json_logging: Annotated[
        bool,
        Field(
            description="Emit JSON logs (newline-delimited) for log aggregation (Loki, Grafana, etc.).",
        ),
    ] = False


class LogExtrasConfig(BaseConfig):
    """Configures extra logging for monitoring platforms."""

    samples: Annotated[
        bool,
        Field(
            description="Whether to log prompt/response samples.",
        ),
    ] = True

    distributions: Annotated[
        bool,
        Field(
            description="Whether to log distributions (like rewards, advantages, etc.).",
        ),
    ] = True

    interval: Annotated[
        int,
        Field(
            ge=1,
            description="Step interval at which to log extras.",
        ),
    ] = 10


class WandbConfig(BaseConfig):
    """Configures logging to Weights and Biases."""

    # Shared configs (May be overwritten by WandbConfig from `rl.py`)
    project: Annotated[str, Field(description="The W&B project to log to.")] = "prime-rl"

    name: Annotated[
        str | None,
        Field(
            description="The W&B name to to use for logging.",
        ),
    ] = None

    offline: Annotated[bool, Field(description="Whether to run W&B in offline mode.")] = False

    # Individual configs (can only be specified on trainer or orchestrator)
    id: Annotated[
        str | None,
        Field(
            description="The W&B run ID to log to. If None, a random ID will be generated. If you want to resume a run, you can set the ID to the run ID you want to resume.",
        ),
    ] = None


class WandbWithExtrasConfig(WandbConfig):
    """Configures logging to Weights and Biases with extras."""

    log_extras: Annotated[
        LogExtrasConfig | None,
        Field(
            description="Configuration for logging extras. If None, no extras are logged.",
        ),
    ] = LogExtrasConfig()


class PrimeMonitorConfig(BaseConfig):
    """Configures logging to Prime Intellect API."""

    base_url: Annotated[
        str,
        Field(
            description="The base URL for Prime Intellect monitoring API.",
        ),
    ] = "https://api.primeintellect.ai/api/internal/rft"

    api_key_var: Annotated[
        str,
        Field(
            description="Name of environment variable containing the API key for Prime Intellect API. Will parse using `os.getenv(config.api_key_var)`.",
        ),
    ] = "PRIME_API_KEY"

    log_extras: Annotated[
        LogExtrasConfig | None,
        Field(
            description="Configuration for logging extras. If None, no extras are logged.",
        ),
    ] = LogExtrasConfig()


class HeartbeatConfig(BaseConfig):
    """Configures the heartbeat for BetterStack."""

    url: Annotated[str, Field(description="The URL to send the heartbeat to.")]


class MetricsServerConfig(BaseConfig):
    """Configures the Prometheus metrics server for trainer observability."""

    port: Annotated[
        int,
        Field(
            ge=1,
            le=65535,
            description="Port to expose metrics and health endpoints. Defaults to 8000.",
        ),
    ] = 8000

    host: Annotated[
        str,
        Field(
            description="Host to bind the server to. Defaults to 0.0.0.0.",
        ),
    ] = "0.0.0.0"


class BaseTransportConfig(BaseModel):
    """Base configuration for transport."""

    pass


class FileSystemTransportConfig(BaseTransportConfig):
    """Configures filesystem-based transport for training examples."""

    type: Literal["filesystem"] = "filesystem"


class ZMQTransportConfig(BaseTransportConfig):
    """Configures ZMQ-based transport for training examples."""

    type: Literal["zmq"] = "zmq"
    host: Annotated[str, Field(description="The host address for ZMQ transport.")] = "localhost"
    port: Annotated[int, Field(description="The base port for ZMQ transport.")] = 5555
    hwm: Annotated[int, Field(description="High water mark (max messages in queue) for ZMQ sockets.")] = 10


TransportConfig: TypeAlias = Annotated[FileSystemTransportConfig | ZMQTransportConfig, Field(discriminator="type")]