@@ -258,12 +258,6 @@ def generate_rl_config_template(environment: str | None = None) -> str:
258258# num_examples = 30
259259# rollouts_per_example = 4
260260
261- # Optional: validation during training
262- # [val]
263- # num_examples = 64
264- # rollouts_per_example = 1
265- # interval = 5
266-
267261# Optional: buffer configuration for difficulty filtering
268262# [buffer]
269263# easy_threshold = 1.0
@@ -409,24 +403,6 @@ def to_api_dict(self) -> Dict[str, Any] | None:
409403 return result
410404
411405
412- class ValConfig (BaseModel ):
413- model_config = ConfigDict (extra = "forbid" )
414-
415- num_examples : int | None = None
416- rollouts_per_example : int | None = None
417- interval : int | None = None
418-
419- def to_api_dict (self ) -> Dict [str , Any ] | None :
420- result : Dict [str , Any ] = {}
421- if self .num_examples is not None :
422- result ["num_examples" ] = self .num_examples
423- if self .rollouts_per_example is not None :
424- result ["rollouts_per_example" ] = self .rollouts_per_example
425- if self .interval is not None :
426- result ["interval" ] = self .interval
427- return result if result else None
428-
429-
430406class BufferConfig (BaseModel ):
431407 model_config = ConfigDict (extra = "forbid" )
432408
@@ -602,7 +578,6 @@ class RLConfig(BaseModel):
602578 env : List [EnvConfig ] = Field (default_factory = list )
603579 sampling : SamplingConfig = Field (default_factory = SamplingConfig )
604580 eval : EvalConfig = Field (default_factory = EvalConfig )
605- val : ValConfig = Field (default_factory = ValConfig )
606581 buffer : BufferConfig = Field (default_factory = BufferConfig )
607582 wandb : WandbConfig = Field (default_factory = WandbConfig )
608583 checkpoints : CheckpointsConfig = Field (default_factory = CheckpointsConfig )
@@ -964,13 +939,6 @@ def _fetch_pricing() -> None:
964939 if cfg .eval .interval :
965940 console .print (f" Interval: { cfg .eval .interval } " )
966941
967- # Validation
968- if cfg .val .num_examples is not None :
969- console .print ("\n [cyan]Validation[/cyan]" )
970- console .print (f" Num Examples: { cfg .val .num_examples } " )
971- if cfg .val .interval :
972- console .print (f" Interval: { cfg .val .interval } " )
973-
974942 # Infrastructure
975943 if cfg .infrastructure .compute_size :
976944 console .print ("\n [cyan]Infrastructure[/cyan]" )
@@ -1096,7 +1064,6 @@ def _format(list_p: Any, eff_p: Any) -> str:
10961064 secrets = secrets if secrets else None ,
10971065 team_id = app_config .team_id ,
10981066 eval_config = cfg .eval .to_api_dict (),
1099- val_config = cfg .val .to_api_dict (),
11001067 buffer_config = cfg .buffer .to_api_dict (),
11011068 learning_rate = cfg .learning_rate ,
11021069 lora_alpha = cfg .lora_alpha ,
0 commit comments