CCPBioSim
diff --git a/‎.github/workflows/ci.yaml‎
Lines changed: 45 additions & 0 deletions b/‎.github/workflows/ci.yaml‎
Lines changed: 45 additions & 0 deletions
diff --git a/‎Makefile‎
Lines changed: 9 additions & 3 deletions b/‎Makefile‎
Lines changed: 9 additions & 3 deletions
diff --git a/‎README.md‎
Lines changed: 8 additions & 7 deletions b/‎README.md‎
Lines changed: 8 additions & 7 deletions
diff --git a/‎devtools/scripts/execute_and_convert_notebooks.py‎
Lines changed: 145 additions & 0 deletions b/‎devtools/scripts/execute_and_convert_notebooks.py‎
Lines changed: 145 additions & 0 deletions
diff --git a/‎devtools/scripts/remove_notebook_solutions.py‎
Lines changed: 73 additions & 0 deletions b/‎devtools/scripts/remove_notebook_solutions.py‎
Lines changed: 73 additions & 0 deletions
@@ -0,0 +1,45 @@
+name: CI
+
+# Scope the group to this workflow so that runs of other workflows on the same
+# ref are never cancelled by (or cancel) this one.
+concurrency:
+  group: ${{ github.workflow }}-${{ github.ref }}
+  cancel-in-progress: true
+
+on:
+  push: { branches: [ "main" ] }
+  pull_request: { branches: [ "main" ] }
+
+# The last step pushes generated files back to the repository, which requires
+# write access to its contents.
+permissions:
+  contents: write
+
+jobs:
+  test:
+
+    runs-on: ubuntu-latest
+    container: condaforge/mambaforge:latest
+
+    steps:
+    - uses: actions/checkout@v4
+
+    - name: Run CI
+      # Ensure the step runs under bash so `pipefail` is supported in the shell flags
+      # The `{0}` placeholder is replaced by the step commands by GitHub Actions.
+      shell: bash -eo pipefail {0}
+      run: |
+        # Fail fast: any command that exits non-zero will stop the job
+        set -euo pipefail
+        IFS=$'\n\t'
+
+        apt update && apt install -y git make
+
+        make env-dev
+        make create-student-nb
+        make run-nb-and-convert-to-md
+
+    - name: Commit and push notebook.md files
+      # Pull-request runs check out a detached merge commit, so there is no
+      # branch to push to; only publish generated files for pushes to main.
+      if: github.event_name == 'push'
+      run: |
+        git config --global --add safe.directory "$GITHUB_WORKSPACE"
+        git config --global user.name "github-actions[bot]"
+        git config --global user.email "github-actions[bot]@users.noreply.github.com"
+        git add notebooks-rendered/
+        git add notebooks/
+        # Commit only when something is staged, so that a genuine commit or
+        # push failure still fails the job instead of being reported as
+        # "nothing to commit".
+        if git diff --cached --quiet; then
+          echo "No changes to commit"
+        else
+          git commit -m "Add generated notebook.md and answerless notebook files [skip ci]"
+          git push
+        fi
+      env:
+        GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
@@ -2,7 +2,7 @@ ENV_NAME := openff-env
 
 CONDA_ENV_RUN   = conda run --no-capture-output --name $(ENV_NAME)
 
-.PHONY: env env-dev clean-nb format-nb run-nb
+.PHONY: env env-dev clean-nb format-nb run-nb create-student-nb run-nb-and-convert-to-md
 
 env:
 	mamba create     --name $(ENV_NAME)
@@ -21,8 +21,14 @@ clean-nb:
 format-nb:
 	$(CONDA_ENV_RUN) find . -name "*.ipynb" -exec nbqa ruff --fix {} --ignore E402 \;
 
+# Write the student copy of each solutions notebook into notebooks/, using
+# devtools/scripts/remove_notebook_solutions.py (input path, then output path).
+create-student-nb:
+	$(CONDA_ENV_RUN) python devtools/scripts/remove_notebook_solutions.py \
+		notebooks_with_solutions/small_molecule_parameterisation.ipynb \
+		notebooks/small_molecule_parameterisation.ipynb
+	$(CONDA_ENV_RUN) python devtools/scripts/remove_notebook_solutions.py \
+		notebooks_with_solutions/protein_ligand_complex_parameterisation_and_md.ipynb \
+		notebooks/protein_ligand_complex_parameterisation_and_md.ipynb
+
+# Execute every notebook found under notebooks_with_solutions, in place.
 run-nb:
-	$(CONDA_ENV_RUN) find . -name "*.ipynb" -exec jupyter nbconvert --to notebook --execute --inplace {} \;
+	$(CONDA_ENV_RUN) find notebooks_with_solutions -name "*.ipynb" -exec jupyter nbconvert --to notebook --execute --inplace {} \;
 
+# Run the notebooks in notebooks_with_solutions through
+# devtools/scripts/execute_and_convert_notebooks.py, passing ci_skip as the
+# skip tag, and write the Markdown output to notebooks-rendered.
 run-nb-and-convert-to-md:
-	$(CONDA_ENV_RUN) find . -name "*.ipynb" -exec jupyter nbconvert --to markdown --execute --output-dir notebooks-rendered {} \;
+	$(CONDA_ENV_RUN) python devtools/scripts/execute_and_convert_notebooks.py \
+		--input-dir notebooks_with_solutions --output-dir notebooks-rendered \
+		--skip-tag ci_skip
@@ -2,25 +2,26 @@
 
 [![CI](https://github.com/openforcefield/ccpbiosim-2025/actions/workflows/ci.yaml/badge.svg)](https://github.com/openforcefield/ccpbiosim-2025/actions/workflows/ci.yaml)
 
+These tutorials were delivered at the 2025 CCPBioSim training week, but are suitable for self-guided learning.
+
 Presenters:
 
 * Danny Cole
 * Finlay Clark
 
-## Agenda
+## Materials
 
-### Half session - Wednesday Morning (11.30 AM - 1 PM)
+We recommend you view the materials in the following order:
 
-* Talk - Intro to OpenFF
+* Talk: [Intro to OpenFF](talk-cole-openFFintro.pdf)
 * Notebook: [Parameterising small molecules with OpenFF](notebooks/small_molecule_parameterisation.ipynb)
-
-### Half session - Wednesday Afternoon (2.00 PM - 3.00 PM)
-
 * Notebook: [Parameterisation, molecular dynamics, and basic trajectory analysis for a protein-ligand complex](notebooks/protein_ligand_complex_parameterisation_and_md.ipynb)
 
+Answers to most exercises are given in the [notebooks_with_solutions directory](notebooks_with_solutions).
+
 ## Local installation
 
-If there are any issues with the provided cloud-hosted JupyterHub instance, or to use these notebooks outside of the workshop hours, use a Python distribution (we recommend [Mambaforge](https://docs.openforcefield.org/en/latest/install.html#quick-install-guide)) and create an environment from the provided YAML file:
+To use these notebooks on your local machine, we recommend using [mamba](https://docs.openforcefield.org/en/latest/install.html#quick-install-guide) to create an environment from the provided YAML file:
 
 ```shell
 $ mamba env create --file environment.yaml
 
@@ -0,0 +1,145 @@
+#!/usr/bin/env python3
+"""Execute and convert notebooks while skipping cells that have a given tag.
+
+This script:
+ - finds .ipynb files under --input-dir
+ - loads each notebook and, for execution only, replaces code cells that have
+   the skip tag with a no-op (their original source is kept in the output)
+ - executes the notebook with nbconvert ExecutePreprocessor
+ - exports the executed notebook to a markdown file under --output-dir
+
+Use this in CI to skip interactive or long-running cells by adding a tag
+to those cells, e.g. tags: ["ci_skip"]
+
+Example:
+  python devtools/scripts/execute_and_convert_notebooks.py \
+    --input-dir notebooks_with_solutions --output-dir notebooks-rendered \
+    --skip-tag ci_skip --timeout 600
+"""
+import argparse
+import nbformat
+from nbformat import NotebookNode
+import sys
+from pathlib import Path
+from typing import List, Optional
+from nbconvert.preprocessors import ExecutePreprocessor
+from nbconvert.exporters import MarkdownExporter
+from copy import deepcopy
+
+
+def notebook_files(input_dir: str) -> List[Path]:
+    """Return every notebook below ``input_dir``, sorted by path.
+
+    The search is recursive. Files inside a ``.ipynb_checkpoints`` directory
+    are ignored: they are editor autosave copies, not notebooks that should
+    be executed or rendered.
+
+    Parameters
+    ----------
+    input_dir
+        Directory to search; anything accepted by ``pathlib.Path`` works.
+
+    Returns
+    -------
+    List[Path]
+        Paths of the ``*.ipynb`` files found, in sorted order. Empty when
+        nothing matches.
+    """
+    root = Path(input_dir)
+    return sorted(
+        path
+        for path in root.rglob("*.ipynb")
+        # Only look at components below the root, so a root that itself lives
+        # under a checkpoint-named directory is still searched.
+        if ".ipynb_checkpoints" not in path.relative_to(root).parts
+    )
+
+
+def remove_tagged_cells(nb: NotebookNode, tag: Optional[str]) -> List[NotebookNode]:
+    """Return the cells of ``nb`` that do not carry ``tag``.
+
+    A new list is always returned and ``nb`` itself is left untouched. When
+    ``tag`` is empty or ``None`` no filtering happens and every cell is kept.
+    """
+    if not tag:
+        return list(nb.cells)
+
+    kept = []
+    for cell in nb.cells:
+        cell_tags = cell.get("metadata", {}).get("tags", [])
+        if tag in cell_tags:
+            continue
+        kept.append(cell)
+    return kept
+
+
+def has_skip_tag(cell: NotebookNode, tag: Optional[str]) -> bool:
+    """Tell whether ``cell`` lists ``tag`` under ``metadata.tags``.
+
+    An empty or ``None`` tag never matches. A cell without metadata or
+    without a tag list is treated as having no tags.
+    """
+    if tag:
+        cell_tags = cell.get("metadata", {}).get("tags", [])
+        return tag in cell_tags
+    return False
+
+
+def execute_notebook(
+    nb: NotebookNode,
+    timeout: int,
+    kernel_name: str,
+    cwd: Optional[str] = None,
+    skip_tag: Optional[str] = None,
+) -> NotebookNode:
+    """Run ``nb`` without executing the code cells tagged ``skip_tag``.
+
+    The execution happens on a deep copy in which every tagged code cell has
+    its source swapped for ``pass``; the copy is run with
+    ``ExecutePreprocessor`` using ``cwd`` (or ``"."``) as the working path.
+    The outputs and execution counts of all code cells are then written back
+    onto ``nb``, whose cell sources are never modified.
+
+    Returns the same ``nb`` object that was passed in.
+    """
+    runnable = deepcopy(nb)
+    for candidate in runnable.cells:
+        is_code = candidate.get("cell_type") == "code"
+        if is_code and has_skip_tag(candidate, skip_tag):
+            # Neutralise the cell and drop whatever results it carried.
+            candidate.source = "pass\n"
+            candidate.outputs = []
+            candidate.execution_count = None
+
+    working_dir = cwd or "."
+    executor = ExecutePreprocessor(timeout=timeout, kernel_name=kernel_name)
+    executor.preprocess(runnable, {"metadata": {"path": working_dir}})
+
+    # Transfer the results, pairing cells by position in the two notebooks.
+    for original, executed in zip(nb.cells, runnable.cells):
+        if original.get("cell_type") != "code":
+            continue
+        original["outputs"] = executed.get("outputs", [])
+        original["execution_count"] = executed.get("execution_count", None)
+
+    return nb
+
+
+def convert_to_markdown(nb, out_path: Path):
+    """Export ``nb`` to Markdown at ``out_path``, with its extracted outputs.
+
+    The Markdown exporter returns binary outputs such as images separately,
+    under ``resources["outputs"]``, and the Markdown body only links to them
+    by file name. Those files are written next to ``out_path`` so the links
+    resolve.
+
+    Parameters
+    ----------
+    nb
+        The (already executed) notebook to export.
+    out_path
+        Destination of the Markdown file; missing parent directories are
+        created. Extracted outputs go to ``<out_path stem>_files/`` beside it.
+    """
+    exporter = MarkdownExporter()
+    stem = out_path.stem
+    # Name the extracted files after the notebook so that several notebooks
+    # rendered into the same directory cannot overwrite each other's outputs.
+    resources = {"unique_key": stem, "output_files_dir": f"{stem}_files"}
+    body, resources = exporter.from_notebook_node(nb, resources=resources)
+
+    out_path.parent.mkdir(parents=True, exist_ok=True)
+    out_path.write_text(body, encoding="utf8")
+
+    # Keys are paths relative to the Markdown file, exactly as linked in body.
+    for rel_name, data in resources.get("outputs", {}).items():
+        target = out_path.parent / rel_name
+        target.parent.mkdir(parents=True, exist_ok=True)
+        if isinstance(data, str):
+            data = data.encode("utf8")
+        target.write_bytes(data)
+
+
+def main(argv=None):
+    """Execute every notebook under ``--input-dir`` and render it to Markdown.
+
+    Parameters
+    ----------
+    argv
+        Argument list to parse; ``None`` lets ``argparse`` read ``sys.argv``.
+
+    Returns
+    -------
+    int
+        ``0`` when every notebook was processed (or none was found), ``1``
+        when at least one notebook failed, ``2`` when the input directory
+        does not exist.
+    """
+    p = argparse.ArgumentParser()
+    p.add_argument("--input-dir", required=True)
+    p.add_argument("--output-dir", required=True)
+    p.add_argument(
+        "--skip-tag",
+        default="ci_skip",
+        # Tagged cells are not removed: they stay in the rendered output and
+        # are only replaced by a no-op while the notebook runs.
+        help="Tag of code cells to skip during execution (kept in the output)",
+    )
+    p.add_argument(
+        "--timeout",
+        type=int,
+        default=600,
+        help="ExecutePreprocessor timeout in seconds",
+    )
+    p.add_argument(
+        "--kernel", default="python3", help="Kernel name to use for execution"
+    )
+    args = p.parse_args(argv)
+
+    input_dir = Path(args.input_dir)
+    output_dir = Path(args.output_dir)
+    if not input_dir.exists():
+        print(f"Input directory not found: {input_dir}", file=sys.stderr)
+        return 2
+
+    files = notebook_files(input_dir)
+    if not files:
+        print(f"No notebooks found under {input_dir}")
+        return 0
+
+    exit_code = 0
+    for nb_path in files:
+        # Mirror the input directory layout below the output directory.
+        rel = nb_path.relative_to(input_dir)
+        out_md = output_dir / rel.with_suffix(".md")
+        print(f"Processing {nb_path} -> {out_md}")
+        try:
+            nb = nbformat.read(str(nb_path), as_version=4)
+            # execute in the notebook's parent directory to keep relative paths working
+            cwd = str(nb_path.parent)
+            nb = execute_notebook(
+                nb,
+                timeout=args.timeout,
+                kernel_name=args.kernel,
+                cwd=cwd,
+                skip_tag=args.skip_tag,
+            )
+            convert_to_markdown(nb, out_md)
+        except Exception as e:
+            # Keep going so one broken notebook does not hide failures in the
+            # others; the non-zero exit code still fails the calling job.
+            print(f"ERROR processing {nb_path}: {e}", file=sys.stderr)
+            exit_code = 1
+
+    return exit_code
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())
@@ -0,0 +1,73 @@
+"""
+Generate a student version of Jupyter notebooks by replacing
+cells tagged as 'solution' with empty code cells containing a placeholder.
+
+Usage:
+    python devtools/scripts/remove_notebook_solutions.py input_notebook.ipynb output_notebook.ipynb
+"""
+
+from __future__ import annotations
+import sys
+from pathlib import Path
+import nbformat
+from nbformat.notebooknode import NotebookNode
+
+
+def make_student_version(
+    input_path: str | Path,
+    output_path: str | Path,
+    tag_to_replace: str = "solution",
+) -> None:
+    """
+    Create a student version of a Jupyter notebook by replacing all cells
+    tagged with `tag_to_replace` by placeholder code cells.
+
+    Cells that are kept have their outputs and execution counts cleared when
+    they are code cells. A placeholder reuses the id of the cell it replaces
+    (when that cell has one), so regenerating the student notebook from an
+    unchanged input yields the same cell ids instead of fresh random ones.
+
+    Parameters
+    ----------
+    input_path : str | Path
+        Path to the input notebook (typically the solutions version).
+    output_path : str | Path
+        Path where the cleaned student notebook should be written. Missing
+        parent directories are created.
+    tag_to_replace : str, optional
+        Tag identifying cells that should be replaced. Default is 'solution'.
+    """
+    input_path = Path(input_path)
+    output_path = Path(output_path)
+
+    nb: NotebookNode = nbformat.read(input_path, as_version=4)
+    new_cells: list[NotebookNode] = []
+
+    for cell in nb.cells:
+        tags: list[str] = cell.get("metadata", {}).get("tags", [])
+
+        if tag_to_replace in tags:
+            # Replace tagged cell with placeholder
+            placeholder = nbformat.v4.new_code_cell(
+                source="# your solution here",
+                metadata={"tags": ["placeholder"]},
+            )
+            # Keep the replaced cell's id so repeated runs are reproducible
+            # and do not show up as spurious changes in version control.
+            if "id" in cell:
+                placeholder["id"] = cell["id"]
+            new_cells.append(placeholder)
+        else:
+            # Clean up execution metadata
+            if cell.cell_type == "code":
+                cell.outputs = []
+                cell.execution_count = None
+            new_cells.append(cell)
+
+    nb.cells = new_cells
+    output_path.parent.mkdir(parents=True, exist_ok=True)
+    nbformat.write(nb, output_path)
+    print(f"✅ Wrote student notebook: {output_path}")
+
+
+def main() -> None:
+    """CLI entry point.
+
+    Expects exactly two command-line arguments, the input notebook and the
+    output notebook. With any other number of arguments a usage message is
+    printed to stderr and the process exits with status 1.
+    """
+    if len(sys.argv) != 3:
+        print(
+            "Usage: python devtools/scripts/remove_notebook_solutions.py "
+            "input.ipynb output.ipynb",
+            file=sys.stderr,
+        )
+        sys.exit(1)
+
+    input_path, output_path = sys.argv[1], sys.argv[2]
+    make_student_version(input_path, output_path)
+
+
+if __name__ == "__main__":
+    main()