Skip to content

Commit f0c05d0

Browse files
committed
final cleanup
1 parent e261d9c commit f0c05d0

6 files changed

Lines changed: 17 additions & 7 deletions

File tree

include/bfloat16.hpp

Lines changed: 5 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,3 +1,8 @@
1+
/*
2+
// Copyright (c) 2024-2026 Ben Ashbaugh
3+
//
4+
// SPDX-License-Identifier: MIT
5+
*/
16
#pragma once
27

38
#include <cmath>

include/util.hpp

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -7,6 +7,9 @@
77

88
#include <CL/opencl.hpp>
99

10+
#include <cctype>
11+
#include <cstdio>
12+
#include <cstring>
1013
#include <fstream>
1114
#include <iterator>
1215
#include <string>

samples/20_matrixexperiments-bf16/main.cpp

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -10,10 +10,12 @@
1010

1111
#include <algorithm>
1212
#include <chrono>
13+
#include <cmath>
14+
#include <cstdint>
1315
#include <iostream>
16+
#include <random>
1417
#include <sstream>
1518
#include <string>
16-
#include <random>
1719
#include <vector>
1820

1921
#include "bfloat16.hpp"

samples/20_matrixexperiments-i8/README.md

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -52,7 +52,6 @@ This sample will optionally use the following OpenCL extensions:
5252
| `--wallclock` | n/a | Measure performance using wallclock time instead of event profiling.
5353
| `--skipinit` | n/a | Skip initialization of source matrices.
5454
| `--roundrobin` | n/a | Use round robin thread scheduling.
55-
| `--threshold <float>` | 0.01 | Set the threshold used when validating results.
5655
| `--mask <int>` | ~0 | Set a mask to only run a subset of tests.
5756

5857
By default, the source matrices are populated with random data.

samples/20_matrixexperiments-i8/main.cpp

Lines changed: 3 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -10,10 +10,12 @@
1010

1111
#include <algorithm>
1212
#include <chrono>
13+
#include <cmath>
14+
#include <cstdint>
1315
#include <iostream>
16+
#include <random>
1417
#include <sstream>
1518
#include <string>
16-
#include <random>
1719
#include <vector>
1820

1921
#include "util.hpp"
@@ -29,7 +31,6 @@ bool wallclock = false;
2931
bool skipinit = false;
3032
bool roundRobin = false;
3133
int testIterations = 16;
32-
float threshold = 0.01f;
3334

3435
std::string makeTestName(
3536
const std::string &func,
@@ -160,7 +161,6 @@ void check_results(
160161
const std::vector<T>& C,
161162
const std::vector<T>& C_ref)
162163
{
163-
float err = 0.f;
164164
for (size_t m = 0; m < M; m++) {
165165
for (size_t n = 0; n < N; n++) {
166166
auto index = m * N + n;
@@ -491,7 +491,6 @@ int main(int argc, char** argv)
491491
op.add<popl::Switch>("", "wallclock", "Measure Wallclock Time", &wallclock);
492492
op.add<popl::Switch>("", "skipinit", "Do Not Initialize Buffers", &skipinit);
493493
op.add<popl::Switch>("", "roundrobin", "Use Round Robin Scheduling", &roundRobin);
494-
op.add<popl::Value<float>>("", "threshold", "Local Error Threshold", threshold, &threshold);
495494
op.add<popl::Value<size_t>, popl::Attribute::advanced>("", "mask", "Test Mask", mask, &mask);
496495
bool printUsage = false;
497496
try {

samples/20_matrixexperiments-tf32/main.cpp

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -10,10 +10,12 @@
1010

1111
#include <algorithm>
1212
#include <chrono>
13+
#include <cmath>
14+
#include <cstdint>
1315
#include <iostream>
16+
#include <random>
1417
#include <sstream>
1518
#include <string>
16-
#include <random>
1719
#include <vector>
1820

1921
#include "util.hpp"

0 commit comments

Comments
 (0)