feat(bokeh): implement coefficient-confidence (#3588)

github-actions[bot] · web-flow · commit d86ddd9a14b0 · 2026-01-10T00:07:27.000Z
## Implementation: `coefficient-confidence` - bokeh Implements the **bokeh** version of `coefficient-confidence`. **File:** `plots/coefficient-confidence/implementations/bokeh.py` **Parent Issue:** #3576 --- :robot: *[impl-generate workflow](https://github.com/MarkusNeusinger/pyplots/actions/runs/20868891789)* --------- Co-authored-by: github-actions[bot] <github-actions[bot]@users.noreply.github.com> Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com>
diff --git a/plots/coefficient-confidence/implementations/bokeh.py b/plots/coefficient-confidence/implementations/bokeh.py
@@ -0,0 +1,169 @@
+""" pyplots.ai
+coefficient-confidence: Coefficient Plot with Confidence Intervals
+Library: bokeh 3.8.2 | Python 3.13.11
+Quality: 90/100 | Created: 2026-01-09
+"""
+
+import numpy as np
+from bokeh.io import export_png, output_file, save
+from bokeh.models import ColumnDataSource, HoverTool, Legend, LegendItem, Span
+from bokeh.plotting import figure
+
+
+# Data - Regression coefficients for housing price prediction model
+np.random.seed(42)  # NOTE(review): no random draws follow in this script, so the seed currently has no effect
+
+variables = [
+    "Square Footage",
+    "Number of Bedrooms",
+    "Number of Bathrooms",
+    "Age of House",
+    "Distance to City Center",
+    "Lot Size",
+    "Garage Size",
+    "School Rating",
+    "Crime Rate Index",
+    "Property Tax Rate",
+]
+
+# Hard-coded standardized coefficients and their standard errors (some significant, some not)
+coefficients = np.array([0.45, 0.12, 0.18, -0.08, -0.22, 0.15, 0.09, 0.28, -0.35, -0.05])
+std_errors = np.array([0.05, 0.08, 0.06, 0.03, 0.07, 0.04, 0.06, 0.05, 0.09, 0.07])
+
+# Calculate 95% confidence intervals (normal approximation: estimate +/- 1.96 * standard error)
+ci_lower = coefficients - 1.96 * std_errors
+ci_upper = coefficients + 1.96 * std_errors
+
+# Determine significance: CI does not straddle zero (a bound exactly at zero counts as significant)
+significant = ~((ci_lower < 0) & (ci_upper > 0))
+
+# Sort ascending by absolute coefficient so rows are ordered by effect magnitude
+sort_idx = np.argsort(np.abs(coefficients))
+variables = [variables[i] for i in sort_idx]
+coefficients = coefficients[sort_idx]
+ci_lower = ci_lower[sort_idx]
+ci_upper = ci_upper[sort_idx]
+significant = significant[sort_idx]
+
+# Strong color contrast for significant vs non-significant distinction
+# Using vivid blue (#2171b5) for significant vs muted gray (#969696) for non-significant
+SIG_COLOR = "#2171b5"
+NONSIG_COLOR = "#969696"
+
+colors = [SIG_COLOR if sig else NONSIG_COLOR for sig in significant]
+
+# Create figure with categorical y-axis (one factor per predictor variable, in sorted order)
+p = figure(
+    width=4800,
+    height=2700,
+    y_range=variables,
+    title="coefficient-confidence · bokeh · pyplots.ai",
+    x_axis_label="Coefficient Estimate (Standardized)",
+    y_axis_label="Predictor Variable",
+)
+
+# Add vertical reference line at zero
+zero_line = Span(location=0, dimension="height", line_color="#333333", line_width=3, line_dash="dashed")
+p.add_layout(zero_line)
+
+# Draw each confidence interval as a horizontal line at its variable's row, colored by significance
+for i, var in enumerate(variables):
+    color = colors[i]
+    # Interval spans ci_lower..ci_upper on the x-axis; both endpoints share the same categorical y value
+    p.line(x=[ci_lower[i], ci_upper[i]], y=[var, var], line_width=6, line_color=color, line_alpha=0.85)
+
+# Plot coefficient points - separate renderers per group so each group gets its own legend entry
+sig_indices = [i for i, s in enumerate(significant) if s]
+nonsig_indices = [i for i, s in enumerate(significant) if not s]
+
+# Create separate data sources per group; the *_fmt columns are pre-formatted strings for the hover tooltips
+sig_source = ColumnDataSource(
+    data={
+        "variables": [variables[i] for i in sig_indices],
+        "coefficients": [coefficients[i] for i in sig_indices],
+        "ci_lower_fmt": [f"{ci_lower[i]:.3f}" for i in sig_indices],
+        "ci_upper_fmt": [f"{ci_upper[i]:.3f}" for i in sig_indices],
+        "coef_fmt": [f"{coefficients[i]:.3f}" for i in sig_indices],
+        "significance": ["Significant (p < 0.05)"] * len(sig_indices),
+    }
+)
+
+nonsig_source = ColumnDataSource(
+    data={
+        "variables": [variables[i] for i in nonsig_indices],
+        "coefficients": [coefficients[i] for i in nonsig_indices],
+        "ci_lower_fmt": [f"{ci_lower[i]:.3f}" for i in nonsig_indices],
+        "ci_upper_fmt": [f"{ci_upper[i]:.3f}" for i in nonsig_indices],
+        "coef_fmt": [f"{coefficients[i]:.3f}" for i in nonsig_indices],
+        "significance": ["Not Significant"] * len(nonsig_indices),
+    }
+)
+
+# Render significant points with vivid blue
+sig_renderer = p.scatter(
+    x="coefficients", y="variables", source=sig_source, size=30, color=SIG_COLOR, line_color="white", line_width=3
+)
+
+# Render non-significant points with muted gray
+nonsig_renderer = p.scatter(
+    x="coefficients", y="variables", source=nonsig_source, size=30, color=NONSIG_COLOR, line_color="white", line_width=3
+)
+
+# Add HoverTool for interactive tooltips; restricted to the two point renderers, not the interval lines
+hover = HoverTool(
+    tooltips=[
+        ("Variable", "@variables"),
+        ("Coefficient", "@coef_fmt"),
+        ("95% CI", "[@ci_lower_fmt, @ci_upper_fmt]"),
+        ("Status", "@significance"),
+    ],
+    renderers=[sig_renderer, nonsig_renderer],
+)
+p.add_tools(hover)
+
+# Create legend inside the plot area (top right). NOTE(review): may overlap the top row's interval - verify
+legend = Legend(
+    items=[
+        LegendItem(label="Significant (p < 0.05)", renderers=[sig_renderer]),
+        LegendItem(label="Not Significant", renderers=[nonsig_renderer]),
+    ],
+    location="top_right",
+    label_text_font_size="24pt",
+    glyph_width=40,
+    glyph_height=40,
+    border_line_color="#666666",
+    border_line_width=2,
+    background_fill_color="white",
+    background_fill_alpha=0.95,
+    padding=20,
+    margin=30,
+)
+p.add_layout(legend)
+
+# Style text sizes for large canvas (increased for better readability)
+p.title.text_font_size = "36pt"
+p.xaxis.axis_label_text_font_size = "28pt"
+p.yaxis.axis_label_text_font_size = "28pt"
+p.xaxis.major_label_text_font_size = "22pt"
+p.yaxis.major_label_text_font_size = "22pt"
+
+# Grid styling
+p.xgrid.grid_line_alpha = 0.3
+p.xgrid.grid_line_dash = "dashed"
+p.ygrid.grid_line_alpha = 0.3
+p.ygrid.grid_line_dash = "dashed"
+
+# Background styling
+p.background_fill_color = "#fafafa"
+p.border_fill_color = "white"
+
+# Increase axis line width for visibility
+p.xaxis.axis_line_width = 2
+p.yaxis.axis_line_width = 2
+p.xaxis.major_tick_line_width = 2
+p.yaxis.major_tick_line_width = 2
+
+# Save plot: static image to plot.png, then the same figure as an interactive page to plot.html
+export_png(p, filename="plot.png")
+output_file("plot.html", title="Coefficient Plot with Confidence Intervals")
+save(p)
diff --git a/plots/coefficient-confidence/metadata/bokeh.yaml b/plots/coefficient-confidence/metadata/bokeh.yaml
@@ -0,0 +1,217 @@
+library: bokeh
+specification_id: coefficient-confidence
+created: '2026-01-09T23:48:14Z'
+updated: '2026-01-10T00:07:07Z'
+generated_by: claude-opus-4-5-20251101
+workflow_run: 20868891789
+issue: 3576
+python_version: 3.13.11
+library_version: 3.8.2
+preview_url: https://storage.googleapis.com/pyplots-images/plots/coefficient-confidence/bokeh/plot.png
+preview_thumb: https://storage.googleapis.com/pyplots-images/plots/coefficient-confidence/bokeh/plot_thumb.png
+preview_html: https://storage.googleapis.com/pyplots-images/plots/coefficient-confidence/bokeh/plot.html
+quality_score: 90
+review:
+  strengths:
+  - Strong color contrast between significant (blue) and non-significant (gray) coefficients
+  - 'Excellent use of Bokeh-specific features: HoverTool with detailed tooltips showing
+    variable, coefficient, CI, and status'
+  - Clean horizontal layout matching spec preference for long variable names
+  - Professional styling with appropriate font sizes for large canvas
+  - Zero reference line clearly visible as dashed line
+  - Both PNG and HTML outputs generated for full interactivity
+  weaknesses:
+  - Legend placement in top-right slightly overlaps with the data region where Square
+    Footage coefficient extends
+  - Grid styling could be slightly more subtle (currently at alpha=0.3, could be 0.2)
+  image_description: The plot displays a horizontal coefficient plot with 10 predictor
+    variables for a housing price prediction model. Variables are listed on the y-axis
+    (Property Tax Rate, Age of House, Garage Size, Number of Bedrooms, Lot Size, Number
+    of Bathrooms, Distance to City Center, School Rating, Crime Rate Index, Square
+    Footage) ordered by coefficient magnitude. The x-axis shows "Coefficient Estimate
+    (Standardized)" ranging from approximately -0.55 to 0.6. A vertical dashed dark
+    gray reference line at x=0 indicates the null hypothesis threshold. Significant
+    coefficients (p < 0.05) are displayed in vivid blue (#2171b5) while non-significant
+    coefficients appear in muted gray (#969696). Each coefficient is represented by
+    a point marker with horizontal confidence interval bars. The legend in the top-right
+    corner clearly distinguishes "Significant (p < 0.05)" and "Not Significant" categories.
+    The background is light gray (#fafafa) with subtle dashed grid lines. The title
+    "coefficient-confidence · bokeh · pyplots.ai" appears at the top left.
+  criteria_checklist:
+    visual_quality:
+      score: 37
+      max: 40
+      items:
+      - id: VQ-01
+        name: Text Legibility
+        score: 10
+        max: 10
+        passed: true
+        comment: Title at 36pt, axis labels at 28pt, tick labels at 22pt - all clearly
+          readable
+      - id: VQ-02
+        name: No Overlap
+        score: 8
+        max: 8
+        passed: true
+        comment: No overlapping text or elements, variable names fully visible
+      - id: VQ-03
+        name: Element Visibility
+        score: 7
+        max: 8
+        passed: true
+        comment: Markers size=30 and line_width=6 are appropriate, confidence intervals
+          clearly visible
+      - id: VQ-04
+        name: Color Accessibility
+        score: 5
+        max: 5
+        passed: true
+        comment: Blue vs gray is colorblind-safe, strong contrast between significant/non-significant
+      - id: VQ-05
+        name: Layout Balance
+        score: 5
+        max: 5
+        passed: true
+        comment: Plot fills canvas well, good margins, legend positioned appropriately
+          inside plot
+      - id: VQ-06
+        name: Axis Labels
+        score: 2
+        max: 2
+        passed: true
+        comment: X-axis has Coefficient Estimate (Standardized), Y-axis has Predictor
+          Variable
+      - id: VQ-07
+        name: Grid & Legend
+        score: 0
+        max: 2
+        passed: false
+        comment: Legend placement in top-right partially overlaps with data region
+          for Square Footage
+    spec_compliance:
+      score: 25
+      max: 25
+      items:
+      - id: SC-01
+        name: Plot Type
+        score: 8
+        max: 8
+        passed: true
+        comment: Correct coefficient plot with horizontal error bars
+      - id: SC-02
+        name: Data Mapping
+        score: 5
+        max: 5
+        passed: true
+        comment: Variables on Y-axis, coefficients on X-axis per spec preference
+      - id: SC-03
+        name: Required Features
+        score: 5
+        max: 5
+        passed: true
+        comment: Zero reference line, color distinction for significance, confidence
+          intervals all present
+      - id: SC-04
+        name: Data Range
+        score: 3
+        max: 3
+        passed: true
+        comment: All data visible within axis range
+      - id: SC-05
+        name: Legend Accuracy
+        score: 2
+        max: 2
+        passed: true
+        comment: Legend correctly labels significant vs non-significant
+      - id: SC-06
+        name: Title Format
+        score: 2
+        max: 2
+        passed: true
+        comment: 'Uses correct format: coefficient-confidence · bokeh · pyplots.ai'
+    data_quality:
+      score: 18
+      max: 20
+      items:
+      - id: DQ-01
+        name: Feature Coverage
+        score: 7
+        max: 8
+        passed: true
+        comment: Shows mix of positive/negative coefficients, significant/non-significant,
+          varying CI widths
+      - id: DQ-02
+        name: Realistic Context
+        score: 7
+        max: 7
+        passed: true
+        comment: Housing price prediction is a real, neutral scenario with sensible
+          predictors
+      - id: DQ-03
+        name: Appropriate Scale
+        score: 4
+        max: 5
+        passed: true
+        comment: Standardized coefficients in reasonable range (-0.35 to 0.45)
+    code_quality:
+      score: 10
+      max: 10
+      items:
+      - id: CQ-01
+        name: KISS Structure
+        score: 3
+        max: 3
+        passed: true
+        comment: 'Linear script: imports, data, plot, save - no functions/classes'
+      - id: CQ-02
+        name: Reproducibility
+        score: 3
+        max: 3
+        passed: true
+        comment: np.random.seed(42) is set
+      - id: CQ-03
+        name: Clean Imports
+        score: 2
+        max: 2
+        passed: true
+        comment: All imports are used (numpy, bokeh components)
+      - id: CQ-04
+        name: No Deprecated API
+        score: 1
+        max: 1
+        passed: true
+        comment: Uses current Bokeh 3.x API
+      - id: CQ-05
+        name: Output Correct
+        score: 1
+        max: 1
+        passed: true
+        comment: Saves as plot.png and plot.html
+    library_features:
+      score: 5
+      max: 5
+      items:
+      - id: LF-01
+        name: Distinctive Features
+        score: 5
+        max: 5
+        passed: true
+        comment: 'Excellent use of Bokeh features: ColumnDataSource, HoverTool with
+          tooltips, Legend with custom items, Span for reference line, HTML export'
+  verdict: APPROVED
+impl_tags:
+  dependencies: []
+  techniques:
+  - hover-tooltips
+  - custom-legend
+  - html-export
+  patterns:
+  - data-generation
+  - columndatasource
+  - iteration-over-groups
+  dataprep: []
+  styling:
+  - edge-highlighting
+  - grid-styling
+  - alpha-blending