fastmachinelearning
diff --git a/‎1_getting_started/1a_train_keras.ipynb‎
Lines changed: 2 additions & 13 deletions b/‎1_getting_started/1a_train_keras.ipynb‎
Lines changed: 2 additions & 13 deletions
diff --git a/‎1_getting_started/1b_train_pytorch.ipynb‎
Lines changed: 2 additions & 13 deletions b/‎1_getting_started/1b_train_pytorch.ipynb‎
Lines changed: 2 additions & 13 deletions
diff --git a/‎1_getting_started/1c_hls4ml_synth.ipynb‎
Lines changed: 2 additions & 17 deletions b/‎1_getting_started/1c_hls4ml_synth.ipynb‎
Lines changed: 2 additions & 17 deletions
diff --git a/‎2_quantization/2a_qkeras.ipynb‎
Lines changed: 2 additions & 8 deletions b/‎2_quantization/2a_qkeras.ipynb‎
Lines changed: 2 additions & 8 deletions
diff --git a/‎2_quantization/2b_brevitas.ipynb‎
Lines changed: 2 additions & 8 deletions b/‎2_quantization/2b_brevitas.ipynb‎
Lines changed: 2 additions & 8 deletions
diff --git a/‎3_advanced_config/3a_reuse_factor.ipynb‎
Lines changed: 3 additions & 33 deletions b/‎3_advanced_config/3a_reuse_factor.ipynb‎
Lines changed: 3 additions & 33 deletions
diff --git a/‎3_advanced_config/3b_profiling.ipynb‎
Lines changed: 2 additions & 19 deletions b/‎3_advanced_config/3b_profiling.ipynb‎
Lines changed: 2 additions & 19 deletions
diff --git a/‎4_advanced_models/4a_qkeras_cnn_svhn.ipynb‎
Lines changed: 3 additions & 26 deletions b/‎4_advanced_models/4a_qkeras_cnn_svhn.ipynb‎
Lines changed: 3 additions & 26 deletions
diff --git a/‎6_more_models/6a_bdt.ipynb‎
Lines changed: 3 additions & 19 deletions b/‎6_more_models/6a_bdt.ipynb‎
Lines changed: 3 additions & 19 deletions
diff --git a/‎_toc.yml‎
Lines changed: 9 additions & 10 deletions b/‎_toc.yml‎
Lines changed: 9 additions & 10 deletions
@@ -115,18 +115,7 @@
    "id": "f3b4d39e",
    "metadata": {},
    "outputs": [],
-   "source": [
-    "scaler = StandardScaler()\n",
-    "X_train_val = scaler.fit_transform(X_train_val)\n",
-    "X_test = scaler.transform(X_test)\n",
-    "\n",
-    "os.makedirs('../data', exist_ok=True)\n",
-    "np.save('../data/X_train_val.npy', X_train_val)\n",
-    "np.save('../data/X_test.npy', X_test)\n",
-    "np.save('../data/y_train_val.npy', y_train_val)\n",
-    "np.save('../data/y_test.npy', y_test)\n",
-    "np.save('../data/classes.npy', le.classes_)"
-   ]
+   "source": "scaler = StandardScaler()\nX_train_val = scaler.fit_transform(X_train_val)\nX_test = scaler.transform(X_test)\n\nos.makedirs('../data/jet-tagging', exist_ok=True)\nnp.save('../data/jet-tagging/X_train_val.npy', X_train_val)\nnp.save('../data/jet-tagging/X_test.npy', X_test)\nnp.save('../data/jet-tagging/y_train_val.npy', y_train_val)\nnp.save('../data/jet-tagging/y_test.npy', y_test)\nnp.save('../data/jet-tagging/classes.npy', le.classes_)"
   },
   {
    "cell_type": "markdown",
@@ -259,4 +248,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 5
-}
+}
@@ -110,18 +110,7 @@
    "execution_count": null,
    "metadata": {},
    "outputs": [],
-   "source": [
-    "scaler = StandardScaler()\n",
-    "X_train_val = scaler.fit_transform(X_train_val)\n",
-    "X_test = scaler.transform(X_test)\n",
-    "\n",
-    "os.makedirs('../data', exist_ok=True)\n",
-    "np.save('../data/X_train_val.npy', X_train_val)\n",
-    "np.save('../data/X_test.npy', X_test)\n",
-    "np.save('../data/y_train_val.npy', y_train_val)\n",
-    "np.save('../data/y_test.npy', y_test)\n",
-    "np.save('../data/classes.npy', le.classes_)"
-   ]
+   "source": "scaler = StandardScaler()\nX_train_val = scaler.fit_transform(X_train_val)\nX_test = scaler.transform(X_test)\n\nos.makedirs('../data/jet-tagging', exist_ok=True)\nnp.save('../data/jet-tagging/X_train_val.npy', X_train_val)\nnp.save('../data/jet-tagging/X_test.npy', X_test)\nnp.save('../data/jet-tagging/y_train_val.npy', y_train_val)\nnp.save('../data/jet-tagging/y_test.npy', y_test)\nnp.save('../data/jet-tagging/classes.npy', le.classes_)"
   },
   {
    "cell_type": "markdown",
@@ -278,4 +267,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 5
-}
+}
@@ -27,22 +27,7 @@
    "execution_count": null,
    "metadata": {},
    "outputs": [],
-   "source": [
-    "import os\n",
-    "os.environ['KERAS_BACKEND'] = 'tensorflow'\n",
-    "\n",
-    "import numpy as np\n",
-    "import matplotlib.pyplot as plt\n",
-    "import sys\n",
-    "sys.path.append('..')\n",
-    "import plotting\n",
-    "import hls4ml\n",
-    "\n",
-    "# Load the test dataset\n",
-    "X_test  = np.ascontiguousarray(np.load('../data/X_test.npy'),  dtype=np.float32)\n",
-    "y_test  = np.load('../data/y_test.npy')\n",
-    "classes = np.load('../data/classes.npy', allow_pickle=True)"
-   ]
+   "source": "import os\nos.environ['KERAS_BACKEND'] = 'tensorflow'\n\nimport numpy as np\nimport matplotlib.pyplot as plt\nimport sys\nsys.path.append('..')\nimport plotting\nimport hls4ml\n\n# Load the test dataset\nX_test  = np.ascontiguousarray(np.load('../data/jet-tagging/X_test.npy'),  dtype=np.float32)\ny_test  = np.load('../data/jet-tagging/y_test.npy')\nclasses = np.load('../data/jet-tagging/classes.npy', allow_pickle=True)"
   },
   {
    "cell_type": "markdown",
@@ -324,4 +309,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 5
-}
+}
@@ -51,13 +51,7 @@
    "id": "cell-3",
    "metadata": {},
    "outputs": [],
-   "source": [
-    "X_train_val = np.load('../data/X_train_val.npy')\n",
-    "X_test      = np.load('../data/X_test.npy')\n",
-    "y_train_val = np.load('../data/y_train_val.npy')\n",
-    "y_test      = np.load('../data/y_test.npy')\n",
-    "classes     = np.load('../data/classes.npy', allow_pickle=True)"
-   ]
+   "source": "X_train_val = np.load('../data/jet-tagging/X_train_val.npy')\nX_test      = np.load('../data/jet-tagging/X_test.npy')\ny_train_val = np.load('../data/jet-tagging/y_train_val.npy')\ny_test      = np.load('../data/jet-tagging/y_test.npy')\nclasses     = np.load('../data/jet-tagging/classes.npy', allow_pickle=True)"
   },
   {
    "cell_type": "markdown",
@@ -345,4 +339,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 5
-}
+}
@@ -59,13 +59,7 @@
    "id": "cell-3",
    "metadata": {},
    "outputs": [],
-   "source": [
-    "X_train_val = np.load('../data/X_train_val.npy')\n",
-    "X_test      = np.load('../data/X_test.npy')\n",
-    "y_train_val = np.load('../data/y_train_val.npy')\n",
-    "y_test      = np.load('../data/y_test.npy')\n",
-    "classes     = np.load('../data/classes.npy', allow_pickle=True)"
-   ]
+   "source": "X_train_val = np.load('../data/jet-tagging/X_train_val.npy')\nX_test      = np.load('../data/jet-tagging/X_test.npy')\ny_train_val = np.load('../data/jet-tagging/y_train_val.npy')\ny_test      = np.load('../data/jet-tagging/y_test.npy')\nclasses     = np.load('../data/jet-tagging/classes.npy', allow_pickle=True)"
   },
   {
    "cell_type": "markdown",
@@ -419,4 +413,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 5
-}
+}
@@ -30,25 +30,7 @@
    "id": "cell-2",
    "metadata": {},
    "outputs": [],
-   "source": [
-    "import os\n",
-    "os.environ['KERAS_BACKEND'] = 'tensorflow'\n",
-    "\n",
-    "import numpy as np\n",
-    "import matplotlib.pyplot as plt\n",
-    "import sys\n",
-    "sys.path.append('..')\n",
-    "import plotting\n",
-    "import hls4ml\n",
-    "from sklearn.metrics import accuracy_score\n",
-    "\n",
-    "%matplotlib inline\n",
-    "\n",
-    "# Load the data\n",
-    "X_test  = np.ascontiguousarray(np.load('../data/X_test.npy'),  dtype=np.float32)\n",
-    "y_test  = np.load('../data/y_test.npy')\n",
-    "classes = np.load('../data/classes.npy', allow_pickle=True)"
-   ]
+   "source": "import os\nos.environ['KERAS_BACKEND'] = 'tensorflow'\n\nimport numpy as np\nimport matplotlib.pyplot as plt\nimport sys\nsys.path.append('..')\nimport plotting\nimport hls4ml\nfrom sklearn.metrics import accuracy_score\n\n%matplotlib inline\n\n# Load the data\nX_test  = np.ascontiguousarray(np.load('../data/jet-tagging/X_test.npy'),  dtype=np.float32)\ny_test  = np.load('../data/jet-tagging/y_test.npy')\nclasses = np.load('../data/jet-tagging/classes.npy', allow_pickle=True)"
   },
   {
    "cell_type": "markdown",
@@ -103,19 +85,7 @@
    "cell_type": "markdown",
    "id": "cell-5",
    "metadata": {},
-   "source": [
-    "## What is the ReuseFactor?\n",
-    "\n",
-    "In the default (`ReuseFactor = 1`) configuration, hls4ml instantiates one multiplier for every weight in the network. All multiplications for a given layer happen in a single clock cycle, giving the minimum possible latency — but using the most multipliers.\n",
-    "\n",
-    "Setting `ReuseFactor = N` tells hls4ml to time-multiplex the same multiplier hardware across `N` weight-input pairs. This means the layer takes `N` clock cycles to compute instead of one, but uses roughly `1/N` as many multipliers.\n",
-    "\n",
-    "![Reuse factor diagram](../images/reuse.png)\n",
-    "\n",
-    "The reuse factor must evenly divide the number of weights in each layer. For example, the first layer has `16 × 64 = 1024` weights, so valid reuse factors include 1, 2, 4, 8, 16, 32, 64, etc.\n",
-    "\n",
-    "Changing the reuse factor does **not** change the model accuracy — the same arithmetic is performed, just spread over more clock cycles. We will verify this below."
-   ]
+   "source": "## What is the ReuseFactor?\n\nIn the default (`ReuseFactor = 1`) configuration, hls4ml instantiates one multiplier for every weight in the network. All multiplications for a given layer happen in a single clock cycle, giving the minimum possible latency — but using the most multipliers.\n\nSetting `ReuseFactor = N` tells hls4ml to time-multiplex the same multiplier hardware across `N` weight-input pairs. This means the layer takes `N` clock cycles to compute instead of one, but uses roughly `1/N` as many multipliers.\n\n![Reuse factor diagram](../images/part3a_reuse_factor.png)\n\nThe reuse factor must evenly divide the number of weights in each layer. For example, the first layer has `16 × 64 = 1024` weights, so valid reuse factors include 1, 2, 4, 8, 16, 32, 64, etc.\n\nChanging the reuse factor does **not** change the model accuracy — the same arithmetic is performed, just spread over more clock cycles. We will verify this below."
   },
   {
    "cell_type": "markdown",
@@ -275,4 +245,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 5
-}
+}
@@ -34,24 +34,7 @@
    "id": "cell-2",
    "metadata": {},
    "outputs": [],
-   "source": [
-    "import os\n",
-    "os.environ['KERAS_BACKEND'] = 'tensorflow'\n",
-    "\n",
-    "import numpy as np\n",
-    "import matplotlib.pyplot as plt\n",
-    "import sys\n",
-    "sys.path.append('..')\n",
-    "import plotting\n",
-    "import hls4ml\n",
-    "from sklearn.metrics import accuracy_score\n",
-    "\n",
-    "%matplotlib inline\n",
-    "\n",
-    "X_test  = np.ascontiguousarray(np.load('../data/X_test.npy'),  dtype=np.float32)\n",
-    "y_test  = np.load('../data/y_test.npy')\n",
-    "classes = np.load('../data/classes.npy', allow_pickle=True)"
-   ]
+   "source": "import os\nos.environ['KERAS_BACKEND'] = 'tensorflow'\n\nimport numpy as np\nimport matplotlib.pyplot as plt\nimport sys\nsys.path.append('..')\nimport plotting\nimport hls4ml\nfrom sklearn.metrics import accuracy_score\n\n%matplotlib inline\n\nX_test  = np.ascontiguousarray(np.load('../data/jet-tagging/X_test.npy'),  dtype=np.float32)\ny_test  = np.load('../data/jet-tagging/y_test.npy')\nclasses = np.load('../data/jet-tagging/classes.npy', allow_pickle=True)"
   },
   {
    "cell_type": "markdown",
@@ -385,4 +368,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 5
-}
+}
@@ -4,17 +4,7 @@
    "cell_type": "markdown",
    "id": "4a-0",
    "metadata": {},
-   "source": [
-    "# Part 4a: Convolutional Neural Networks with QKeras on the SVHN dataset\n",
-    "\n",
-    "In this notebook we train a quantized convolutional neural network (CNN) on the [Street View House Numbers (SVHN)](http://ufldl.stanford.edu/housenumbers/) dataset and deploy it with hls4ml.\n",
-    "\n",
-    "The SVHN dataset consists of real-world images of house numbers extracted from Google Street View, cropped to 32×32 RGB pixels. Unlike MNIST it is a harder, more realistic problem: images can contain more than one digit, and the centre digit defines the label. Each image belongs to one of 10 classes (digits 0–9).\n",
-    "\n",
-    "![SVHN examples from the test set](../images/test.png)\n",
-    "\n",
-    "The dataset has 73,257 training images and 26,032 test images."
-   ]
+   "source": "# Part 4a: Convolutional Neural Networks with QKeras on the SVHN dataset\n\nIn this notebook we train a quantized convolutional neural network (CNN) on the [Street View House Numbers (SVHN)](http://ufldl.stanford.edu/housenumbers/) dataset and deploy it with hls4ml.\n\nThe SVHN dataset consists of real-world images of house numbers extracted from Google Street View, cropped to 32×32 RGB pixels. Unlike MNIST it is a harder, more realistic problem: images can contain more than one digit, and the centre digit defines the label. Each image belongs to one of 10 classes (digits 0–9).\n\n![SVHN examples from the test set](../images/part4a_test_images.png)\n\nThe dataset has 73,257 training images and 26,032 test images."
   },
   {
    "cell_type": "code",
@@ -276,20 +266,7 @@
    "cell_type": "markdown",
    "id": "4a-13",
    "metadata": {},
-   "source": [
-    "## Convolutions in hls4ml\n",
-    "\n",
-    "hls4ml supports two I/O modes for neural networks:\n",
-    "\n",
-    "- **`io_parallel`**: All inputs arrive simultaneously. Suitable for small models, when all activations fit into registers.\n",
-    "- **`io_stream`**: Data flows through the network one element at a time via FIFO buffers. Required for larger CNNs, when the full feature maps are too large to hold in registers. Shift registers maintain a sliding window of `kernel_height − 1` rows, feeding the convolution kernel one pixel at a time.\n",
-    "\n",
-    "See the [hls4ml documentation](https://fastmachinelearning.org/hls4ml/concepts.html) for more details.\n",
-    "\n",
-    "![Conv2D stream implementation](../images/conv2d_animation.gif)\n",
-    "\n",
-    "**Note on softmax precision:** using `auto` precision for the output of the last dense layer can produce accumulators wider than the softmax look-up tables can handle. We cap this manually with `fixed<16,6,RND,SAT>`."
-   ]
+   "source": "## Convolutions in hls4ml\n\nhls4ml supports two I/O modes for neural networks:\n\n- **`io_parallel`**: All inputs arrive simultaneously. Suitable for small models, when all activations fit into registers.\n- **`io_stream`**: Data flows through the network one element at a time via FIFO buffers. Required for larger CNNs, when the full feature maps are too large to hold in registers. Shift registers maintain a sliding window of `kernel_height − 1` rows, feeding the convolution kernel one pixel at a time.\n\nSee the [hls4ml documentation](https://fastmachinelearning.org/hls4ml/concepts.html) for more details.\n\n![Conv2D stream implementation](../images/part4a_conv2d_animation.gif)\n\n**Note on softmax precision:** using `auto` precision for the output of the last dense layer can produce accumulators wider than the softmax look-up tables can handle. We cap this manually with `fixed<16,6,RND,SAT>`."
   },
   {
    "cell_type": "code",
@@ -440,4 +417,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 5
-}
+}
@@ -78,13 +78,7 @@
    "execution_count": null,
    "metadata": {},
    "outputs": [],
-   "source": [
-    "X_train_val = np.load('../data/X_train_val.npy')\n",
-    "X_test = np.load('../data/X_test.npy')\n",
-    "y_train_val_one_hot = np.load('../data/y_train_val.npy')\n",
-    "y_test_one_hot = np.load('../data/y_test.npy')\n",
-    "classes = np.load('../data/classes.npy', allow_pickle=True)"
-   ]
+   "source": "X_train_val = np.load('../data/jet-tagging/X_train_val.npy')\nX_test = np.load('../data/jet-tagging/X_test.npy')\ny_train_val_one_hot = np.load('../data/jet-tagging/y_train_val.npy')\ny_test_one_hot = np.load('../data/jet-tagging/y_test.npy')\nclasses = np.load('../data/jet-tagging/classes.npy', allow_pickle=True)"
   },
   {
    "cell_type": "markdown",
@@ -485,17 +479,7 @@
   {
    "cell_type": "markdown",
    "metadata": {},
-   "source": [
-    "## Build the model\n",
-    "\n",
-    "Now we run `build` again, running HLS Synthesis, Logic Synthesis and Place & Route, finally producing a bitfile and an archive of files that we'll need to run inference on the pynq-z2 board. \n",
-    "\n",
-    "**This step takes around 20 minutes.**\n",
-    "\n",
-    "The floorplan of the bitfile should like something like this, where the individual tree modules are highlighted in different colours:\n",
-    "\n",
-    "<img src=\"../images/part5_floorplan.png\" width=\"300\" />"
-   ]
+   "source": "## Build the model\n\nNow we run `build` again, running HLS Synthesis, Logic Synthesis and Place & Route, finally producing a bitfile and an archive of files that we'll need to run inference on the pynq-z2 board. \n\n**This step takes around 20 minutes.**\n\nThe floorplan of the bitfile should look something like this, where the individual tree modules are highlighted in different colours:\n\n<img src=\"../images/part6a_bdt_floorplan.png\" width=\"300\" />"
   },
   {
    "cell_type": "code",
@@ -547,4 +531,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 4
-}
+}
@@ -1,13 +1,12 @@
 format: jb-book
 root: README.md
 chapters:
- - file: part1_getting_started.ipynb
- - file: part2_advanced_config.ipynb
- - file: part3_compression.ipynb
- - file: part4_quantization.ipynb
- - file: part5_bdt.ipynb
- - file: part6_cnns.ipynb
- - file: part7a_bitstream.ipynb
- - file: part7b_deployment.ipynb
- - file: part7c_validation.ipynb
- - file: part8_symbolic_regression.ipynb
+ - file: 1_getting_started/1a_train_keras.ipynb
+ - file: 1_getting_started/1b_train_pytorch.ipynb
+ - file: 1_getting_started/1c_hls4ml_synth.ipynb
+ - file: 2_quantization/2a_qkeras.ipynb
+ - file: 2_quantization/2b_brevitas.ipynb
+ - file: 3_advanced_config/3a_reuse_factor.ipynb
+ - file: 3_advanced_config/3b_profiling.ipynb
+ - file: 4_advanced_models/4a_qkeras_cnn_svhn.ipynb
+ - file: 6_more_models/6a_bdt.ipynb