feat(plotnine): implement violin-grouped-swarm (#3545)

github-actions[bot] · web-flow · commit b0d4af369b16 · 2026-01-09T16:53:41.000Z
## Implementation: `violin-grouped-swarm` - plotnine Implements the **plotnine** version of `violin-grouped-swarm`. **File:** `plots/violin-grouped-swarm/implementations/plotnine.py` **Parent Issue:** #3529 --- :robot: *[impl-generate workflow](https://github.com/MarkusNeusinger/pyplots/actions/runs/20858843569)* --------- Co-authored-by: github-actions[bot] <github-actions[bot]@users.noreply.github.com> Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com>
diff --git a/plots/violin-grouped-swarm/implementations/plotnine.py b/plots/violin-grouped-swarm/implementations/plotnine.py
@@ -0,0 +1,82 @@
+""" pyplots.ai
+violin-grouped-swarm: Grouped Violin Plot with Swarm Overlay
+Library: plotnine 0.15.2 | Python 3.13.11
+Quality: 91/100 | Created: 2026-01-09
+"""
+
+import numpy as np
+import pandas as pd
+from plotnine import (
+    aes,
+    element_line,
+    element_text,
+    geom_jitter,
+    geom_violin,
+    ggplot,
+    guide_legend,
+    guides,
+    labs,
+    position_dodge,
+    position_jitterdodge,
+    scale_color_manual,
+    scale_fill_manual,
+    theme,
+    theme_minimal,
+)
+
+
+# Data - Response times (ms) across task types and expertise levels
+np.random.seed(42)
+
+categories = ["Simple", "Moderate", "Complex"]
+groups = ["Novice", "Expert"]
+n_per_combination = 40
+
+data = []
+for category in categories:
+    for group in groups:
+        # Base response time varies by complexity
+        base = {"Simple": 400, "Moderate": 700, "Complex": 1100}[category]
+        # Experts are faster
+        if group == "Expert":
+            base -= 150
+        # Generate data with varying spreads
+        spread = {"Simple": 60, "Moderate": 100, "Complex": 150}[category]
+        values = np.random.normal(base, spread, n_per_combination)
+        # Add some variation for visual interest
+        values = np.clip(values, base - 3 * spread, base + 3 * spread)
+        for v in values:
+            data.append({"task_type": category, "expertise": group, "response_time": v})
+
+df = pd.DataFrame(data)
+# Set category order
+df["task_type"] = pd.Categorical(df["task_type"], categories=categories, ordered=True)
+df["expertise"] = pd.Categorical(df["expertise"], categories=groups, ordered=True)
+
+# Colors - Python Blue and Yellow
+colors = {"Novice": "#306998", "Expert": "#FFD43B"}
+
+# Create plot
+plot = (
+    ggplot(df, aes(x="task_type", y="response_time", fill="expertise", color="expertise"))
+    + geom_violin(position=position_dodge(width=0.8), alpha=0.5, size=0.8)
+    + geom_jitter(position=position_dodge(width=0.8), size=2.5, alpha=0.8)
+    + scale_fill_manual(values=colors, name="Expertise")
+    + scale_color_manual(values=colors, name="Expertise")
+    + guides(fill=guide_legend(), color=guide_legend())
+    + labs(title="violin-grouped-swarm · plotnine · pyplots.ai", x="Task Type", y="Response Time (ms)")
+    + theme_minimal()
+    + theme(
+        figure_size=(16, 9),
+        text=element_text(size=14),
+        axis_title=element_text(size=20),
+        axis_text=element_text(size=16),
+        plot_title=element_text(size=24),
+        legend_title=element_text(size=18),
+        legend_text=element_text(size=16),
+        panel_grid_major=element_line(alpha=0.3),
+        panel_grid_minor=element_line(alpha=0.15),
+    )
+)
+
+# Save
+plot.save("plot.png", dpi=300, verbose=False)
diff --git a/plots/violin-grouped-swarm/metadata/plotnine.yaml b/plots/violin-grouped-swarm/metadata/plotnine.yaml
@@ -0,0 +1,211 @@
+library: plotnine
+specification_id: violin-grouped-swarm
+created: '2026-01-09T16:48:57Z'
+updated: '2026-01-09T16:52:15Z'
+generated_by: claude-opus-4-5-20251101
+workflow_run: 20858843569
+issue: 3529
+python_version: 3.13.11
+library_version: 0.15.2
+preview_url: https://storage.googleapis.com/pyplots-images/plots/violin-grouped-swarm/plotnine/plot.png
+preview_thumb: https://storage.googleapis.com/pyplots-images/plots/violin-grouped-swarm/plotnine/plot_thumb.png
+preview_html: null
+quality_score: 91
+review:
+  strengths:
+  - Excellent color palette with high contrast (blue/yellow) that is colorblind-safe
+  - Clean layered grammar of graphics approach with geom_violin + geom_jitter
+  - Realistic and well-thought-out data scenario with varying complexity levels and
+    expertise
+  - Proper use of position_dodge to align grouped elements
+  - Text sizing follows guidelines perfectly for 4800x2700 output
+  weaknesses:
+  - Legend appears with duplicate Expertise entries (both fill and color scales create
+    separate legend items)
+  - Uses geom_jitter for swarm points rather than true swarm positioning - plotnine
+    lacks native geom_beeswarm
+  - The guides() call with guide_legend() does not effectively merge the legends
+  image_description: 'The plot displays a grouped violin chart with swarm overlay
+    showing response times (in milliseconds) across three task types (Simple, Moderate,
+    Complex) and two expertise levels (Novice in steel blue, Expert in golden yellow).
+    Each violin shape effectively shows the distribution of data, with individual
+    data points rendered as jittered markers inside the violins. The Novice group
+    consistently shows higher response times than Expert across all task complexity
+    levels. Response times increase from Simple (~300-500ms) to Moderate (~400-900ms)
+    to Complex (~600-1400ms). The violins have semi-transparent fills (alpha ~0.5)
+    allowing the swarm points to remain visible. The title uses the correct format:
+    ''violin-grouped-swarm · plotnine · pyplots.ai''. The legend is positioned on
+    the right side, clearly labeling the two expertise levels with matching colors.'
+  criteria_checklist:
+    visual_quality:
+      score: 37
+      max: 40
+      items:
+      - id: VQ-01
+        name: Text Legibility
+        score: 10
+        max: 10
+        passed: true
+        comment: Title at 24pt, axis labels at 20pt, tick labels at 16pt - all perfectly
+          readable
+      - id: VQ-02
+        name: No Overlap
+        score: 8
+        max: 8
+        passed: true
+        comment: No overlapping text elements, violins well-spaced
+      - id: VQ-03
+        name: Element Visibility
+        score: 7
+        max: 8
+        passed: true
+        comment: Swarm points visible, though slightly small for the data density;
+          violins well-sized
+      - id: VQ-04
+        name: Color Accessibility
+        score: 5
+        max: 5
+        passed: true
+        comment: Blue and yellow palette is colorblind-safe, excellent contrast
+      - id: VQ-05
+        name: Layout Balance
+        score: 5
+        max: 5
+        passed: true
+        comment: Good proportions, plot fills canvas well, balanced margins
+      - id: VQ-06
+        name: Axis Labels
+        score: 2
+        max: 2
+        passed: true
+        comment: Y-axis includes units 'Response Time (ms)', X-axis labeled 'Task
+          Type'
+      - id: VQ-07
+        name: Grid & Legend
+        score: 0
+        max: 2
+        passed: false
+        comment: Grid is subtle (alpha 0.3), but legend shows duplicate entries (Expertise
+          appears twice with same colors)
+    spec_compliance:
+      score: 23
+      max: 25
+      items:
+      - id: SC-01
+        name: Plot Type
+        score: 8
+        max: 8
+        passed: true
+        comment: Correct grouped violin plot with swarm overlay
+      - id: SC-02
+        name: Data Mapping
+        score: 5
+        max: 5
+        passed: true
+        comment: Category on x-axis, values on y-axis, grouping by color/hue
+      - id: SC-03
+        name: Required Features
+        score: 3
+        max: 5
+        passed: true
+        comment: Has violins, swarm points, grouping, transparency; however swarm
+          points use jitter rather than true swarm positioning
+      - id: SC-04
+        name: Data Range
+        score: 3
+        max: 3
+        passed: true
+        comment: All data visible within axes
+      - id: SC-05
+        name: Legend Accuracy
+        score: 2
+        max: 2
+        passed: true
+        comment: Legend correctly identifies Novice and Expert groups
+      - id: SC-06
+        name: Title Format
+        score: 2
+        max: 2
+        passed: true
+        comment: Correct format '{spec-id} · {library} · pyplots.ai'
+    data_quality:
+      score: 20
+      max: 20
+      items:
+      - id: DQ-01
+        name: Feature Coverage
+        score: 8
+        max: 8
+        passed: true
+        comment: Shows varying distributions across complexity levels and expertise,
+          different spreads visible
+      - id: DQ-02
+        name: Realistic Context
+        score: 7
+        max: 7
+        passed: true
+        comment: Response time across task complexity is a real, neutral, plausible
+          scenario
+      - id: DQ-03
+        name: Appropriate Scale
+        score: 5
+        max: 5
+        passed: true
+        comment: Response times in 200-1400ms range are realistic for cognitive tasks
+    code_quality:
+      score: 9
+      max: 10
+      items:
+      - id: CQ-01
+        name: KISS Structure
+        score: 3
+        max: 3
+        passed: true
+        comment: Simple imports -> data -> plot -> save structure
+      - id: CQ-02
+        name: Reproducibility
+        score: 3
+        max: 3
+        passed: true
+        comment: np.random.seed(42) set
+      - id: CQ-03
+        name: Clean Imports
+        score: 1
+        max: 2
+        passed: true
+        comment: All imports used, but guide_legend import may be unnecessary
+      - id: CQ-04
+        name: No Deprecated API
+        score: 1
+        max: 1
+        passed: true
+        comment: Uses current plotnine API
+      - id: CQ-05
+        name: Output Correct
+        score: 1
+        max: 1
+        passed: true
+        comment: Saves as 'plot.png'
+    library_features:
+      score: 2
+      max: 5
+      items:
+      - id: LF-01
+        name: Distinctive Features
+        score: 2
+        max: 5
+        passed: false
+        comment: Uses plotnine grammar of graphics with layered geoms and position_dodge,
+          but uses geom_jitter instead of proper swarm positioning
+  verdict: APPROVED
+impl_tags:
+  dependencies: []
+  techniques:
+  - layer-composition
+  patterns:
+  - data-generation
+  - iteration-over-groups
+  dataprep: []
+  styling:
+  - alpha-blending
+  - grid-styling