mert-cemri
diff --git a/‎.gitignore‎
Lines changed: 3 additions & 0 deletions b/‎.gitignore‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎examples/alphaevolve_math_problems/circle_packing_rect/config_azure_gpt.yaml‎
Lines changed: 90 additions & 0 deletions b/‎examples/alphaevolve_math_problems/circle_packing_rect/config_azure_gpt.yaml‎
Lines changed: 90 additions & 0 deletions
diff --git a/‎examples/alphaevolve_math_problems/circle_packing_rect/config_gemini.yaml‎
Lines changed: 90 additions & 0 deletions b/‎examples/alphaevolve_math_problems/circle_packing_rect/config_gemini.yaml‎
Lines changed: 90 additions & 0 deletions
diff --git a/‎examples/alphaevolve_math_problems/erdos_min_overlap/config_azure_gpt.yaml‎
Lines changed: 88 additions & 0 deletions b/‎examples/alphaevolve_math_problems/erdos_min_overlap/config_azure_gpt.yaml‎
Lines changed: 88 additions & 0 deletions
diff --git a/‎examples/alphaevolve_math_problems/erdos_min_overlap/config_gemini.yaml‎
Lines changed: 88 additions & 0 deletions b/‎examples/alphaevolve_math_problems/erdos_min_overlap/config_gemini.yaml‎
Lines changed: 88 additions & 0 deletions
@@ -65,3 +65,6 @@ problems
 
 # NFS temp files
 .nfs*
+
+# Shell scripts with API keys
+examples/alphaevolve_math_problems/run_*.sh
@@ -0,0 +1,90 @@
+# Evolution settings
+max_iterations: 100
+checkpoint_interval: 10
+log_level: "INFO"
+
+# LLM configuration (Azure OpenAI)
+llm:
+  primary_model: "gpt-5"
+  api_base: "https://east-docetl.openai.azure.com/openai/deployments/gpt-4.1?api-version=2024-12-01-preview"
+  api_key: "${OPENAI_API_KEY}"
+  primary_model_weight: 1.0
+  temperature: 0.7
+  max_tokens: 32000
+  timeout: 600
+
+# Database configuration (MAP-Elites algorithm)
+database:
+  population_size: 40
+  num_islands: 5
+  migration_interval: 40
+  feature_dimensions:
+    - "score"
+    - "complexity"
+
+  # Adaptive exploration settings
+  use_adaptive_search: true
+  adaptive_window_size: 20
+  adaptive_min_exploration: 0.1
+  adaptive_max_exploration: 0.7
+
+  # Softmax sampling for exploitation
+  exploitation_temperature: 1.0
+
+  # Stagnation detection and multi-child generation
+  stagnation_threshold: 10
+  stagnation_multi_child_count: 3
+  sibling_context_limit: 5
+
+  # ============================================
+  # AutoEvolve Advanced Features (Sky Lab UC Berkeley)
+  # ============================================
+  
+  # Paradigm Breakthrough
+  enable_paradigm_breakthrough: true
+  stagnation_window: 5
+  stagnation_improvement_threshold: 0.01
+  stagnation_paradigm_samples: 3
+  paradigm_model: "gpt-5-mini"
+  paradigm_api_base: "https://east-docetl.openai.azure.com/openai/deployments/gpt-4.1?api-version=2024-12-01-preview"
+  paradigm_api_key: "${OPENAI_API_KEY}"
+
+  # Error Retry
+  enable_error_retry: true
+  max_error_retries: 2
+
+evaluator:
+  timeout: 360
+  max_retries: 3
+
+# Prompt configuration
+prompt:
+  system_message: |
+    SETTING:
+    You are an expert computational geometer and optimization specialist with deep expertise in circle packing problems, geometric optimization algorithms, and constraint satisfaction.
+    Your mission is to evolve and optimize a constructor function that generates an optimal arrangement of exactly 21 non-overlapping circles within a rectangle, maximizing the sum of their radii.
+
+    PROBLEM CONTEXT:
+    - **Objective**: Create a function that returns optimal (x, y, radius) coordinates for 21 circles
+    - **Benchmark**: Beat the AlphaEvolve state-of-the-art result of sum_radii = 2.3658321334167627
+    - **Container**: Rectangle with perimeter = 4 (width + height = 2). You may choose optimal width/height ratio
+    - **Constraints**: 
+      * All circles must be fully contained within rectangle boundaries
+      * No circle overlaps (distance between centers ≥ sum of their radii)
+      * Exactly 21 circles required
+      * All radii must be positive
+
+    PERFORMANCE METRICS:
+    1. **sum_radii**: Total sum of all 21 circle radii (PRIMARY OBJECTIVE - maximize)
+    2. **combined_score**: sum_radii / 2.3658321334167627 (progress toward beating benchmark)  
+    3. **eval_time**: Execution time in seconds (keep reasonable, prefer accuracy over speed)
+
+    TECHNICAL REQUIREMENTS:
+    - **Determinism**: Use fixed random seeds if employing stochastic methods for reproducibility
+    - **Error handling**: Graceful handling of optimization failures or infeasible configurations
+    - **Memory efficiency**: Avoid excessive memory allocation for distance matrix computations
+    - **Scalability**: Design with potential extension to different circle counts in mind
+      
+  num_top_programs: 3
+  num_diverse_programs: 2
+
@@ -0,0 +1,90 @@
+# Evolution settings
+max_iterations: 100
+checkpoint_interval: 10
+log_level: "INFO"
+
+# LLM configuration (Gemini)
+llm:
+  primary_model: "gemini-3-pro-preview"
+  api_base: "https://generativelanguage.googleapis.com/v1beta/openai/"
+  api_key: "${OPENAI_API_KEY}"
+  primary_model_weight: 1.0
+  temperature: 0.7
+  max_tokens: 32000
+  timeout: 600
+
+# Database configuration (MAP-Elites algorithm)
+database:
+  population_size: 40
+  num_islands: 5
+  migration_interval: 40
+  feature_dimensions:
+    - "score"
+    - "complexity"
+
+  # Adaptive exploration settings
+  use_adaptive_search: true
+  adaptive_window_size: 20
+  adaptive_min_exploration: 0.1
+  adaptive_max_exploration: 0.7
+
+  # Softmax sampling for exploitation
+  exploitation_temperature: 1.0
+
+  # Stagnation detection and multi-child generation
+  stagnation_threshold: 10
+  stagnation_multi_child_count: 3
+  sibling_context_limit: 5
+
+  # ============================================
+  # AutoEvolve Advanced Features (Sky Lab UC Berkeley)
+  # ============================================
+  
+  # Paradigm Breakthrough
+  enable_paradigm_breakthrough: true
+  stagnation_window: 5
+  stagnation_improvement_threshold: 0.01
+  stagnation_paradigm_samples: 3
+  paradigm_model: "gpt-5-mini"
+  paradigm_api_base: "https://east-docetl.openai.azure.com/openai/deployments/gpt-4.1?api-version=2024-12-01-preview"
+  paradigm_api_key: "${PARADIGM_API_KEY}"
+
+  # Error Retry
+  enable_error_retry: true
+  max_error_retries: 2
+
+evaluator:
+  timeout: 360
+  max_retries: 3
+
+# Prompt configuration
+prompt:
+  system_message: |
+    SETTING:
+    You are an expert computational geometer and optimization specialist with deep expertise in circle packing problems, geometric optimization algorithms, and constraint satisfaction.
+    Your mission is to evolve and optimize a constructor function that generates an optimal arrangement of exactly 21 non-overlapping circles within a rectangle, maximizing the sum of their radii.
+
+    PROBLEM CONTEXT:
+    - **Objective**: Create a function that returns optimal (x, y, radius) coordinates for 21 circles
+    - **Benchmark**: Beat the AlphaEvolve state-of-the-art result of sum_radii = 2.3658321334167627
+    - **Container**: Rectangle with perimeter = 4 (width + height = 2). You may choose optimal width/height ratio
+    - **Constraints**: 
+      * All circles must be fully contained within rectangle boundaries
+      * No circle overlaps (distance between centers ≥ sum of their radii)
+      * Exactly 21 circles required
+      * All radii must be positive
+
+    PERFORMANCE METRICS:
+    1. **sum_radii**: Total sum of all 21 circle radii (PRIMARY OBJECTIVE - maximize)
+    2. **combined_score**: sum_radii / 2.3658321334167627 (progress toward beating benchmark)  
+    3. **eval_time**: Execution time in seconds (keep reasonable, prefer accuracy over speed)
+
+    TECHNICAL REQUIREMENTS:
+    - **Determinism**: Use fixed random seeds if employing stochastic methods for reproducibility
+    - **Error handling**: Graceful handling of optimization failures or infeasible configurations
+    - **Memory efficiency**: Avoid excessive memory allocation for distance matrix computations
+    - **Scalability**: Design with potential extension to different circle counts in mind
+      
+  num_top_programs: 3
+  num_diverse_programs: 2
+
@@ -0,0 +1,88 @@
+# Evolution settings
+max_iterations: 200
+checkpoint_interval: 10
+log_level: "INFO"
+
+# LLM configuration (Azure OpenAI)
+llm:
+  primary_model: "gpt-5"
+  api_base: "https://east-docetl.openai.azure.com/openai/deployments/gpt-4.1?api-version=2024-12-01-preview"
+  api_key: "${OPENAI_API_KEY}"
+  primary_model_weight: 1.0
+  temperature: 0.7
+  max_tokens: 32000
+  timeout: 600
+
+# Database configuration (MAP-Elites algorithm)
+database:
+  population_size: 40
+  num_islands: 5
+  migration_interval: 40
+  feature_dimensions:
+    - "score"
+    - "complexity"
+
+  # Adaptive exploration settings
+  use_adaptive_search: true
+  adaptive_window_size: 20
+  adaptive_min_exploration: 0.1
+  adaptive_max_exploration: 0.7
+
+  # Softmax sampling for exploitation
+  exploitation_temperature: 1.0
+
+  # Stagnation detection and multi-child generation
+  stagnation_threshold: 10
+  stagnation_multi_child_count: 3
+  sibling_context_limit: 5
+
+  # ============================================
+  # AutoEvolve Advanced Features (Sky Lab UC Berkeley)
+  # ============================================
+  
+  # Paradigm Breakthrough
+  enable_paradigm_breakthrough: true
+  stagnation_window: 5
+  stagnation_improvement_threshold: 0.01
+  stagnation_paradigm_samples: 3
+  paradigm_model: "gpt-5-mini"
+  paradigm_api_base: "https://east-docetl.openai.azure.com/openai/deployments/gpt-4.1?api-version=2024-12-01-preview"
+  paradigm_api_key: "${OPENAI_API_KEY}"
+
+  # Error Retry
+  enable_error_retry: true
+  max_error_retries: 2
+
+evaluator:
+  timeout: 360
+  max_retries: 3
+
+# Prompt configuration
+prompt:
+  system_message: |
+    SETTING:
+    You are an expert in harmonic analysis, numerical optimization, and AI-driven mathematical discovery.
+    Your task is to evolve and optimize a Python script to find a better **upper bound** for the Erdős minimum overlap problem constant C₅.
+    
+    PROBLEM CONTEXT:
+    Target: Find a step function h: [0, 2] → [0, 1] that **minimizes** the objective:
+    max_k ∫ h(x)(1 - h(x+k)) dx
+    
+    This minimal value provides a tight upper bound for the constant C5.
+    
+    Current best known upper bound: C5 ≤ 0.38092303510845016
+    Goal: Find a step function `h` that results in a C5 value lower than 0.38092303510845016.
+    
+    CONSTRAINTS:
+    1. The function `h` must have values in the range [0, 1].
+    2. The integral of h(x) over [0, 2] must be exactly 1.
+    
+    PERFORMANCE METRICS:
+    - c5_bound: The bound found by the program.
+    - combined_score: 0.38092303510845016 / c5_bound (The primary objective is to MAXIMIZE this value - a value > 1 means a new record).
+    - n_points: number of points used in the discretization.
+    - eval_time: evaluation time of the program.
+    
+  num_top_programs: 3
+  num_diverse_programs: 2
+
@@ -0,0 +1,88 @@
+# Evolution settings
+max_iterations: 200
+checkpoint_interval: 10
+log_level: "INFO"
+
+# LLM configuration (Gemini)
+llm:
+  primary_model: "gemini-3-pro-preview"
+  api_base: "https://generativelanguage.googleapis.com/v1beta/openai/"
+  api_key: "${OPENAI_API_KEY}"
+  primary_model_weight: 1.0
+  temperature: 0.7
+  max_tokens: 32000
+  timeout: 600
+
+# Database configuration (MAP-Elites algorithm)
+database:
+  population_size: 40
+  num_islands: 5
+  migration_interval: 40
+  feature_dimensions:
+    - "score"
+    - "complexity"
+
+  # Adaptive exploration settings
+  use_adaptive_search: true
+  adaptive_window_size: 20
+  adaptive_min_exploration: 0.1
+  adaptive_max_exploration: 0.7
+
+  # Softmax sampling for exploitation
+  exploitation_temperature: 1.0
+
+  # Stagnation detection and multi-child generation
+  stagnation_threshold: 10
+  stagnation_multi_child_count: 3
+  sibling_context_limit: 5
+
+  # ============================================
+  # AutoEvolve Advanced Features (Sky Lab UC Berkeley)
+  # ============================================
+  
+  # Paradigm Breakthrough
+  enable_paradigm_breakthrough: true
+  stagnation_window: 5
+  stagnation_improvement_threshold: 0.01
+  stagnation_paradigm_samples: 3
+  paradigm_model: "gpt-5-mini"
+  paradigm_api_base: "https://east-docetl.openai.azure.com/openai/deployments/gpt-4.1?api-version=2024-12-01-preview"
+  paradigm_api_key: "${PARADIGM_API_KEY}"
+
+  # Error Retry
+  enable_error_retry: true
+  max_error_retries: 2
+
+evaluator:
+  timeout: 360
+  max_retries: 3
+
+# Prompt configuration
+prompt:
+  system_message: |
+    SETTING:
+    You are an expert in harmonic analysis, numerical optimization, and AI-driven mathematical discovery.
+    Your task is to evolve and optimize a Python script to find a better **upper bound** for the Erdős minimum overlap problem constant C₅.
+    
+    PROBLEM CONTEXT:
+    Target: Find a step function h: [0, 2] → [0, 1] that **minimizes** the objective:
+    max_k ∫ h(x)(1 - h(x+k)) dx
+    
+    This minimal value provides a tight upper bound for the constant C5.
+    
+    Current best known upper bound: C5 ≤ 0.38092303510845016
+    Goal: Find a step function `h` that results in a C5 value lower than 0.38092303510845016.
+    
+    CONSTRAINTS:
+    1. The function `h` must have values in the range [0, 1].
+    2. The integral of h(x) over [0, 2] must be exactly 1.
+    
+    PERFORMANCE METRICS:
+    - c5_bound: The bound found by the program.
+    - combined_score: 0.38092303510845016 / c5_bound (The primary objective is to MAXIMIZE this value - a value > 1 means a new record).
+    - n_points: number of points used in the discretization.
+    - eval_time: evaluation time of the program.
+    
+  num_top_programs: 3
+  num_diverse_programs: 2
+