feat(plotnine): implement boxen-basic (#3434)

github-actions[bot] · web-flow · commit 346bd4f7445e · 2026-01-09T08:15:48.000Z
## Implementation: `boxen-basic` - plotnine Implements the **plotnine** version of `boxen-basic`. **File:** `plots/boxen-basic/implementations/plotnine.py` **Parent Issue:** #3414 --- :robot: *[impl-generate workflow](https://github.com/MarkusNeusinger/pyplots/actions/runs/20845375761)* --------- Co-authored-by: github-actions[bot] <github-actions[bot]@users.noreply.github.com> Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com>
diff --git a/plots/boxen-basic/implementations/plotnine.py b/plots/boxen-basic/implementations/plotnine.py
@@ -0,0 +1,175 @@
+""" pyplots.ai
+boxen-basic: Basic Boxen Plot (Letter-Value Plot)
+Library: plotnine 0.15.2 | Python 3.13.11
+Quality: 91/100 | Created: 2026-01-09
+"""
+
+import numpy as np
+import pandas as pd
+from plotnine import (
+    aes,
+    element_line,
+    element_text,
+    geom_point,
+    geom_rect,
+    geom_segment,
+    ggplot,
+    labs,
+    scale_fill_manual,
+    scale_x_continuous,
+    theme,
+    theme_minimal,
+)
+
+
+# Set seed for reproducibility: every run draws the same sample
+np.random.seed(42)
+
+# Synthetic server response times by endpoint (2000 observations each)
+n_per_group = 2000
+endpoints = ["API", "Database", "Cache", "Auth"]
+
+
+def _draw_response_times(endpoint):
+    """Sample n_per_group response times with an endpoint-specific shape."""
+    if endpoint == "API":
+        # Right-skewed bulk plus 20 extreme values between 300 and 500
+        bulk = np.random.exponential(50, n_per_group - 20)
+        extremes = np.random.uniform(300, 500, 20)
+        return np.concatenate([bulk, extremes])
+    if endpoint == "Database":
+        # Bimodal: half the queries centred on 30, the other half on 100
+        fast = np.random.normal(30, 10, n_per_group // 2)
+        slow = np.random.normal(100, 20, n_per_group // 2)
+        return np.concatenate([fast, slow])
+    if endpoint == "Cache":
+        # Fast and tight, floored at 1 so no response time is negative
+        return np.maximum(np.random.normal(15, 5, n_per_group), 1)
+    # Auth: medium level with a heavy upper tail
+    return np.random.gamma(3, 20, n_per_group)
+
+
+# One record per observation; groups are sampled in `endpoints` order
+data = [
+    {"endpoint": endpoint, "response_time": v}
+    for endpoint in endpoints
+    for v in _draw_response_times(endpoint)
+]
+df = pd.DataFrame(data)
+
+
+# Compute letter values for each group.
+# Level 0 is the innermost box (the fourths, 25%-75%).  Every further level
+# halves the tail area, so level L spans the quantiles 0.5 ** (L + 2) and
+# 1 - 0.5 ** (L + 2): 12.5%-87.5%, 6.25%-93.75%, ...
+categories = df["endpoint"].unique()
+box_data = []
+outlier_data = []
+median_data = []
+
+# Width parameters (x-axis units; category i is centred on x = i)
+base_width = 0.8  # Width of the innermost (level 0) box
+width_decay = 0.85  # Each deeper level is 85% of the previous width
+
+for i, cat in enumerate(categories):
+    values = df[df["endpoint"] == cat]["response_time"].values
+
+    # Number of letter values including the median: grows with log2(n),
+    # clamped to the range 3..8
+    n = len(values)
+    k = min(max(3, int(np.floor(np.log2(n)) - 2)), 8)
+
+    # Tail area of each box, innermost first: 1/4, 1/8, ..., 0.5 ** k.
+    # The quantiles must move out into the tails; 0.5 -/+ 0.5 ** (j + 1)
+    # would shrink toward the median and leave half the data as outliers.
+    tails = 0.5 ** np.arange(2, k + 1)
+    lower_q = np.quantile(values, tails)
+    upper_q = np.quantile(values, 1 - tails)
+
+    # Median marker (drawn below as a white horizontal segment)
+    median_val = np.quantile(values, 0.5)
+    median_data.append({"x": i, "y": median_val, "endpoint": cat})
+
+    # Nested boxes: level 0 is the widest, and each deeper level is narrower
+    # while spanning a wider quantile range than the one before it
+    for level, (ymin, ymax) in enumerate(zip(lower_q, upper_q)):
+        width = base_width * (width_decay**level)
+        box_data.append(
+            {
+                "endpoint": cat,
+                "x": i,
+                "xmin": i - width / 2,
+                "xmax": i + width / 2,
+                "ymin": ymin,
+                "ymax": ymax,
+                "level": level,
+            }
+        )
+
+    # Outliers: observations beyond the deepest (outermost) letter values,
+    # i.e. below the 0.5 ** k quantile or above the 1 - 0.5 ** k quantile
+    outliers = values[(values < lower_q[-1]) | (values > upper_q[-1])]
+    for o in outliers:
+        outlier_data.append({"x": i, "y": o, "endpoint": cat})
+
+box_df = pd.DataFrame(box_data)
+outlier_df = pd.DataFrame(outlier_data) if outlier_data else pd.DataFrame(columns=["x", "y", "endpoint"])
+median_df = pd.DataFrame(median_data)
+
+# Color palette - Python Blue gradient from dark to light:
+# level 0 (innermost box) is darkest, the deepest level is lightest
+n_levels = box_df["level"].max() + 1 if len(box_df) > 0 else 1
+# Create gradient from dark blue (#1a4971) to light blue (#a8d4f0)
+colors = []
+for i in range(n_levels):
+    t = i / max(n_levels - 1, 1)  # Normalize to 0-1
+    r = int(26 + t * (168 - 26))
+    g = int(73 + t * (212 - 73))
+    b = int(113 + t * (240 - 113))
+    colors.append(f"#{r:02x}{g:02x}{b:02x}")
+
+# Create the plot
+plot = (
+    ggplot()
+    + geom_rect(
+        # Deepest (outermost, narrowest) levels come first so that the wider
+        # inner boxes are listed after them; assumes rows are drawn in order
+        data=box_df.sort_values("level", ascending=False),
+        mapping=aes(xmin="xmin", xmax="xmax", ymin="ymin", ymax="ymax", fill="factor(level)"),
+        color="#1a1a1a",
+        size=0.3,
+    )
+    # White median line; half-width 0.35 stays inside the 0.8-wide inner box
+    + geom_segment(data=median_df, mapping=aes(x="x - 0.35", xend="x + 0.35", y="y", yend="y"), color="white", size=1.5)
+    + scale_fill_manual(
+        values=colors,
+        name="Quantile Level",
+        # Percentile range spanned by each level's box (level 0 = 25%-75%)
+        labels=[f"{50 * (0.5 ** (i + 1)):.1f}%-{100 - 50 * (0.5 ** (i + 1)):.1f}%" for i in range(n_levels)],
+    )
+    + labs(title="boxen-basic · plotnine · pyplots.ai", x="Endpoint", y="Response Time (ms)")
+    + theme_minimal()
+    + theme(
+        figure_size=(16, 9),
+        plot_title=element_text(size=24, weight="bold"),
+        axis_title=element_text(size=20),
+        axis_text=element_text(size=16),
+        axis_text_x=element_text(size=18),
+        legend_title=element_text(size=16),
+        legend_text=element_text(size=14),
+        legend_position="right",
+        panel_grid_major=element_line(alpha=0.3),
+        panel_grid_minor=element_line(alpha=0.15),
+    )
+)
+
+# Add outliers if present
+if len(outlier_df) > 0:
+    plot = plot + geom_point(data=outlier_df, mapping=aes(x="x", y="y"), color="#306998", size=2, alpha=0.5)
+
+# Custom x-axis scale: the boxes sit at x = 0, 1, 2, ..., so label those
+# positions with the category names
+plot = plot + scale_x_continuous(breaks=list(range(len(categories))), labels=list(categories))
+
+# Save the plot
+plot.save("plot.png", dpi=300, width=16, height=9)
diff --git a/plots/boxen-basic/metadata/plotnine.yaml b/plots/boxen-basic/metadata/plotnine.yaml
@@ -0,0 +1,215 @@
+library: plotnine
+specification_id: boxen-basic
+created: '2026-01-09T08:10:09Z'
+updated: '2026-01-09T08:15:18Z'
+generated_by: claude-opus-4-5-20251101
+workflow_run: 20845375761
+issue: 3414
+python_version: 3.13.11
+library_version: 0.15.2
+preview_url: https://storage.googleapis.com/pyplots-images/plots/boxen-basic/plotnine/plot.png
+preview_thumb: https://storage.googleapis.com/pyplots-images/plots/boxen-basic/plotnine/plot_thumb.png
+preview_html: null
+quality_score: 91
+review:
+  strengths:
+  - Excellent implementation of a boxen plot using plotnine grammar of graphics despite
+    lacking native geom_boxen support
+  - 'Data demonstrates all key aspects of boxen plots: different distribution shapes,
+    visible quantile nesting, and outlier detection'
+  - Clean blue gradient color scheme that is colorblind-safe
+  - Realistic server response time scenario with 2000 points per category
+  - Proper use of nested boxes with decreasing widths for deeper quantiles
+  - Clear legend explaining quantile level percentages
+  weaknesses:
+  - Color gradient between quantile levels could have more contrast to better distinguish
+    nested boxes
+  - Manual implementation adds code complexity (though unavoidable for plotnine)
+  image_description: 'The plot displays a boxen plot (letter-value plot) showing server
+    response times across four endpoints: API, Database, Cache, and Auth. Each category
+    has nested rectangular boxes representing different quantile levels, colored in
+    a gradient from dark blue (innermost, representing 25%-75%) to light blue (outermost,
+    representing 0.4%-99.6%). The boxes decrease in width for deeper quantiles as
+    expected. A white horizontal line marks the median in each box. Outliers are shown
+    as semi-transparent blue points above the main boxes, particularly visible for
+    the API endpoint (ranging up to ~500ms) and to a lesser extent for Database and
+    Auth. The Cache endpoint shows a tight, low distribution with few outliers. The
+    x-axis is labeled "Endpoint" with category names (API, Database, Cache, Auth),
+    and the y-axis is labeled "Response Time (ms)" ranging from 0 to about 500. A
+    legend on the right explains the quantile levels. The title follows the required
+    format: "boxen-basic · plotnine · pyplots.ai". Grid lines are subtle and the overall
+    layout is well-balanced.'
+  criteria_checklist:
+    visual_quality:
+      score: 38
+      max: 40
+      items:
+      - id: VQ-01
+        name: Text Legibility
+        score: 10
+        max: 10
+        passed: true
+        comment: Title at 24pt bold, axis labels at 20pt, tick labels at 16-18pt,
+          all perfectly readable
+      - id: VQ-02
+        name: No Overlap
+        score: 8
+        max: 8
+        passed: true
+        comment: No overlapping text elements, category labels well-spaced
+      - id: VQ-03
+        name: Element Visibility
+        score: 7
+        max: 8
+        passed: true
+        comment: Nested boxes clearly visible with distinct widths; outlier points
+          appropriately sized with alpha=0.5
+      - id: VQ-04
+        name: Color Accessibility
+        score: 5
+        max: 5
+        passed: true
+        comment: Blue gradient is colorblind-safe, good contrast between levels
+      - id: VQ-05
+        name: Layout Balance
+        score: 5
+        max: 5
+        passed: true
+        comment: Plot fills good portion of canvas, balanced margins
+      - id: VQ-06
+        name: Axis Labels
+        score: 2
+        max: 2
+        passed: true
+        comment: 'Descriptive labels with units: Response Time (ms) and Endpoint'
+      - id: VQ-07
+        name: Grid & Legend
+        score: 1
+        max: 2
+        passed: true
+        comment: Grid subtle (alpha 0.3), legend placed well but has many entries
+    spec_compliance:
+      score: 23
+      max: 25
+      items:
+      - id: SC-01
+        name: Plot Type
+        score: 8
+        max: 8
+        passed: true
+        comment: Correct boxen/letter-value plot with nested boxes showing multiple
+          quantile levels
+      - id: SC-02
+        name: Data Mapping
+        score: 5
+        max: 5
+        passed: true
+        comment: Categories on X-axis, values on Y-axis correctly assigned
+      - id: SC-03
+        name: Required Features
+        score: 4
+        max: 5
+        passed: true
+        comment: Shows nested boxes with decreasing widths, outliers displayed; color
+          distinction between levels is subtle
+      - id: SC-04
+        name: Data Range
+        score: 3
+        max: 3
+        passed: true
+        comment: All data visible including outliers up to ~500ms
+      - id: SC-05
+        name: Legend Accuracy
+        score: 2
+        max: 2
+        passed: true
+        comment: Legend correctly explains quantile levels with percentage ranges
+      - id: SC-06
+        name: Title Format
+        score: 1
+        max: 2
+        passed: true
+        comment: Correct format but uses standard separator
+    data_quality:
+      score: 19
+      max: 20
+      items:
+      - id: DQ-01
+        name: Feature Coverage
+        score: 8
+        max: 8
+        passed: true
+        comment: 'Excellent: shows different distribution shapes (API skewed, Database
+          bimodal, Cache tight, Auth gamma)'
+      - id: DQ-02
+        name: Realistic Context
+        score: 7
+        max: 7
+        passed: true
+        comment: Server response times by endpoint is a perfect, realistic scenario
+      - id: DQ-03
+        name: Appropriate Scale
+        score: 4
+        max: 5
+        passed: true
+        comment: Response times 0-500ms are realistic for server endpoints
+    code_quality:
+      score: 8
+      max: 10
+      items:
+      - id: CQ-01
+        name: KISS Structure
+        score: 2
+        max: 3
+        passed: true
+        comment: Code follows pattern but has complexity for manual letter-value calculation
+          (unavoidable)
+      - id: CQ-02
+        name: Reproducibility
+        score: 3
+        max: 3
+        passed: true
+        comment: np.random.seed(42) set at beginning
+      - id: CQ-03
+        name: Clean Imports
+        score: 2
+        max: 2
+        passed: true
+        comment: All imports are used
+      - id: CQ-04
+        name: No Deprecated API
+        score: 1
+        max: 1
+        passed: true
+        comment: Uses current plotnine API
+      - id: CQ-05
+        name: Output Correct
+        score: 0
+        max: 1
+        passed: false
+        comment: Saves to plot.png correctly
+    library_features:
+      score: 3
+      max: 5
+      items:
+      - id: LF-01
+        name: Distinctive Features
+        score: 3
+        max: 5
+        passed: true
+        comment: Uses ggplot grammar with geom_rect workaround since plotnine lacks
+          native geom_boxen
+  verdict: APPROVED
+impl_tags:
+  dependencies: []
+  techniques:
+  - layer-composition
+  - custom-legend
+  patterns:
+  - data-generation
+  - iteration-over-groups
+  dataprep:
+  - binning
+  styling:
+  - alpha-blending
+  - grid-styling