coding-kitties
diff --git a/‎analyze_assertion_discrepancies.py‎
Lines changed: 0 additions & 58 deletions b/‎analyze_assertion_discrepancies.py‎
Lines changed: 0 additions & 58 deletions
diff --git a/‎debug_advanced.py‎
Lines changed: 0 additions & 98 deletions b/‎debug_advanced.py‎
Lines changed: 0 additions & 98 deletions
diff --git a/‎debug_chart.py‎
Lines changed: 0 additions & 18 deletions b/‎debug_chart.py‎
Lines changed: 0 additions & 18 deletions
diff --git a/‎debug_template.py‎
Lines changed: 0 additions & 39 deletions b/‎debug_template.py‎
Lines changed: 0 additions & 39 deletions
diff --git a/‎find_discrepancies.py‎
Lines changed: 0 additions & 57 deletions b/‎find_discrepancies.py‎
Lines changed: 0 additions & 57 deletions
diff --git a/‎report/charts_and_tables.py‎
Lines changed: 113 additions & 0 deletions b/‎report/charts_and_tables.py‎
Lines changed: 113 additions & 0 deletions
@@ -1973,3 +1973,116 @@ def create_pass_fail_by_evaluation_type_chart(data):
     fig3.update_xaxes(showgrid=True, gridwidth=1, gridcolor='lightgray')
     fig3.update_yaxes(showgrid=True, gridwidth=1, gridcolor='lightgray')
     return fig3
+
+
+def create_combined_assertions_bar_chart(data: Dict[str, pd.DataFrame]) -> go.Figure:
+    """
+    Build a single grouped bar chart of assertion outcomes per dataset.
+
+    Each entry in ``data`` contributes one x-axis category. Its label is derived
+    from the entry's key, and its three bars are the column sums of
+    ``number_of_assertions_passed``, ``number_of_assertions_failed`` and
+    ``number_of_assertions_missed`` in the entry's DataFrame.
+
+    Args:
+        data: Mapping of result-set key to the DataFrame holding its
+            per-row assertion counts.
+
+    Returns:
+        Plotly Figure with one bar trace per outcome (passed, failed, missed).
+    """
+    # One entry per trace, in drawing order:
+    # (legend name, summed column, bar colour, hover template).
+    series_specs = (
+        (
+            'Assertions Passed',
+            'number_of_assertions_passed',
+            '#28a745',  # Green
+            '<b>%{x}</b><br>Assertions Passed: %{y}<extra></extra>',
+        ),
+        (
+            'Assertions Failed',
+            'number_of_assertions_failed',
+            '#dc3545',  # Red
+            '<b>%{x}</b><br>Assertions Failed: %{y}<extra></extra>',
+        ),
+        (
+            'Assertions Missed',
+            'number_of_assertions_missed',
+            '#ffc107',  # Yellow/Orange
+            '<b>%{x}</b><br>Assertions Missed: %{y}<br><i>(Due to build errors, etc.)</i><extra></extra>',
+        ),
+    )
+
+    labels = []
+    totals = {column: [] for _, column, _, _ in series_specs}
+
+    for key, df in data.items():
+        is_multishot_key = '_multishot_' in key
+        if '_singleshot_' in key or is_multishot_key:
+            # Advanced-results keys: label is model + rag + instruction + shot mode.
+            uses_rag = '_rag_' in key and (
+                '_rag_detailed' in key or '_rag_simple' in key
+            )
+            label_parts = [
+                key.split('_')[0],
+                'rag' if uses_rag else 'norag',
+                'detailed' if '_detailed' in key else 'simple',
+                'multishot' if is_multishot_key else 'singleshot',
+            ]
+        else:
+            # Exercism keys: everything before '_multi_shot' names the model.
+            multishot_enabled = 'multi_shot_build_error_enabled_True' in key
+            label_parts = [
+                key.split('_multi_shot')[0],
+                'multishot' if multishot_enabled else 'singleshot',
+            ]
+        labels.append('_'.join(label_parts))
+
+        # Sum in the same passed -> failed -> missed order as the traces.
+        for column, bucket in totals.items():
+            bucket.append(df[column].sum())
+
+    fig = go.Figure()
+    for trace_name, column, colour, hover in series_specs:
+        fig.add_trace(go.Bar(
+            name=trace_name,
+            x=labels,
+            y=totals[column],
+            marker_color=colour,
+            opacity=0.8,
+            text=totals[column],
+            textposition='outside',
+            hovertemplate=hover,
+        ))
+
+    title_style = dict(
+        text='Assertions Performance by Model and Configuration',
+        x=0.5,
+        xanchor='center',
+        font=dict(size=18),
+    )
+    legend_style = {
+        'orientation': 'h',
+        'yanchor': 'bottom',
+        'y': 1.02,
+        'xanchor': 'right',
+        'x': 1,
+    }
+    fig.update_layout(
+        title=title_style,
+        xaxis_title='Models and Configurations',
+        yaxis_title='Number of Assertions',
+        barmode='group',
+        width=1200,
+        height=700,
+        template='plotly_white',
+        legend=legend_style,
+        # Bottom margin is the largest of the four; x tick labels are rotated below.
+        margin={'b': 150, 'l': 80, 'r': 80, 't': 100},
+    )
+
+    fig.update_xaxes(tickangle=45, tickfont={'size': 10})
+    fig.update_yaxes(showgrid=True, gridwidth=1, gridcolor='lightgray')
+    return fig
+