55import sys
66import termios
77import tty
8+ from datetime import datetime , timezone
89from pathlib import Path
910from typing import Any , Dict , List , Optional , Tuple
1011
@@ -787,8 +788,8 @@ def _create_eval_set(self) -> None:
787788 "batchSize" : 10 ,
788789 "timeoutMinutes" : 20 ,
789790 "modelSettings" : [],
790- "createdAt" : "2025-01-25T00: 00:00Z" ,
791- "updatedAt" : "2025-01-25T00: 00:00Z" ,
791+ "createdAt" : datetime . now ( timezone . utc ). isoformat (). replace ( '+ 00:00' , 'Z' ) ,
792+ "updatedAt" : datetime . now ( timezone . utc ). isoformat (). replace ( '+ 00:00' , 'Z' ) ,
792793 "evaluations" : []
793794 }
794795
@@ -895,8 +896,8 @@ def _create_eval_set_interactive(self) -> None:
895896 "simulateTools" : False ,
896897 "toolsToSimulate" : [],
897898 "evalSetId" : f"eval-{ len (self .eval_sets ) + 1 } " ,
898- "createdAt" : "2025-01-25T00: 00:00Z" ,
899- "updatedAt" : "2025-01-25T00: 00:00Z"
899+ "createdAt" : datetime . now ( timezone . utc ). isoformat (). replace ( '+ 00:00' , 'Z' ) ,
900+ "updatedAt" : datetime . now ( timezone . utc ). isoformat (). replace ( '+ 00:00' , 'Z' )
900901 }
901902 evaluations .append (evaluation )
902903 test_count += 1
@@ -915,8 +916,8 @@ def _create_eval_set_interactive(self) -> None:
915916 "batchSize" : 10 ,
916917 "timeoutMinutes" : 20 ,
917918 "modelSettings" : [],
918- "createdAt" : "2025-01-25T00: 00:00Z" ,
919- "updatedAt" : "2025-01-25T00: 00:00Z" ,
919+ "createdAt" : datetime . now ( timezone . utc ). isoformat (). replace ( '+ 00:00' , 'Z' ) ,
920+ "updatedAt" : datetime . now ( timezone . utc ). isoformat (). replace ( '+ 00:00' , 'Z' ) ,
920921 "evaluations" : evaluations
921922 }
922923
@@ -986,8 +987,8 @@ def _add_evaluations_interactive(self, eval_set_id: str) -> List[Dict[str, Any]]
986987 "simulateTools" : False ,
987988 "toolsToSimulate" : [],
988989 "evalSetId" : eval_set_id ,
989- "createdAt" : "2025-01-25T00: 00:00Z" ,
990- "updatedAt" : "2025-01-25T00: 00:00Z"
990+ "createdAt" : datetime . now ( timezone . utc ). isoformat (). replace ( '+ 00:00' , 'Z' ) ,
991+ "updatedAt" : datetime . now ( timezone . utc ). isoformat (). replace ( '+ 00:00' , 'Z' )
991992 }
992993 evaluations .append (evaluation )
993994 test_count += 1
@@ -1020,8 +1021,8 @@ def _create_evaluator(self) -> None:
10201021 "category" : 0 ,
10211022 "type" : 1 ,
10221023 "targetOutputKey" : "*" ,
1023- "createdAt" : "2025-01-25T00: 00:00Z" ,
1024- "updatedAt" : "2025-01-25T00: 00:00Z"
1024+ "createdAt" : datetime . now ( timezone . utc ). isoformat (). replace ( '+ 00:00' , 'Z' ) ,
1025+ "updatedAt" : datetime . now ( timezone . utc ). isoformat (). replace ( '+ 00:00' , 'Z' )
10251026 }
10261027 else : # JSON Similarity
10271028 evaluator = {
@@ -1031,8 +1032,8 @@ def _create_evaluator(self) -> None:
10311032 "category" : 0 ,
10321033 "type" : 6 ,
10331034 "targetOutputKey" : "*" ,
1034- "createdAt" : "2025-01-25T00: 00:00Z" ,
1035- "updatedAt" : "2025-01-25T00: 00:00Z"
1035+ "createdAt" : datetime . now ( timezone . utc ). isoformat (). replace ( '+ 00:00' , 'Z' ) ,
1036+ "updatedAt" : datetime . now ( timezone . utc ). isoformat (). replace ( '+ 00:00' , 'Z' )
10361037 }
10371038
10381039 # Ensure evaluators directory exists
0 commit comments