Add initial version of performance measurement

michalharakal · michalharakal · commit 73fd383f9f87 · 2025-09-15T12:54:42.000+02:00
Related-To: #36
diff --git a/docs/modules/performance/nav.adoc b/docs/modules/performance/nav.adoc
@@ -0,0 +1,4 @@
+* xref:index.adoc[Performance Measurement]
+** xref:benchmark-framework.adoc[Benchmark Framework]
+** xref:performance-testing.adoc[Performance Testing Guide]
+** xref:metrics-analysis.adoc[Metrics and Analysis]
diff --git a/docs/modules/performance/pages/index.adoc b/docs/modules/performance/pages/index.adoc
@@ -0,0 +1,70 @@
+= Performance Measurement Framework
+:toc:
+:toclevels: 3
+:sectanchors:
+:sectlinks:
+
+The SKaiNET Performance Measurement Framework provides comprehensive tools for benchmarking tensor operations and analyzing computational performance across different backends and configurations.
+
+== Overview
+
+The performance measurement framework is designed to:
+
+* Measure execution time and throughput of tensor operations
+* Compare performance between different compute backends
+* Provide statistical analysis of benchmark results
+* Generate detailed performance reports
+* Support multiplatform benchmarking
+
+== Key Components
+
+=== BenchmarkRunner
+
+The `BenchmarkRunner` class is the core component that executes performance measurements:
+
+[source,kotlin]
+----
+val runner = BenchmarkRunner()
+val result = runner.benchmark(
+    name = "Matrix Multiplication 256x256",
+    warmupRuns = 10,
+    measurementRuns = 100
+) {
+    // Your operation to benchmark
+    backend.matmul(matrixA, matrixB)
+}
+----
+
+=== Benchmark Results
+
+The framework provides comprehensive result analysis:
+
+* **TimeStatistics**: Mean, median, standard deviation, min/max and 95th-percentile execution times (in microseconds)
+* **MemoryStatistics**: Memory usage tracking (platform-dependent)
+* **BenchmarkResult**: Complete benchmark results with metadata
+* **BenchmarkReport**: Comprehensive reports for multiple operations
+
+=== Performance Analysis
+
+Advanced analysis capabilities include:
+
+* Statistical analysis of execution times
+* Throughput calculations (operations per second)
+* Performance comparison between backends
+* Speedup analysis and regression detection
+
+== Quick Start
+
+. Add the performance module dependency to your test configuration
+. Create a `BenchmarkRunner` instance
+. Use the `benchmark()` method to measure your operations
+. Analyze results using the provided data classes
+
+== Module Structure
+
+The performance module (Gradle project path `:skainet-core:skainet-performance`) contains:
+
+* Core benchmarking infrastructure
+* Result analysis and reporting tools
+* Statistical utilities
+* Multiplatform compatibility layer
diff --git a/skainet-core/skainet-performance/build.gradle.kts b/skainet-core/skainet-performance/build.gradle.kts
@@ -0,0 +1,59 @@
+import org.jetbrains.kotlin.gradle.ExperimentalKotlinGradlePluginApi
+import org.jetbrains.kotlin.gradle.ExperimentalWasmDsl
+import org.jetbrains.kotlin.gradle.dsl.JvmTarget
+
+plugins { // plugin ids are resolved through the `libs` catalog accessors
+    alias(libs.plugins.kotlinMultiplatform) // enables the `kotlin { }` multiplatform block below
+    alias(libs.plugins.androidLibrary) // enables the `android { }` block below
+    alias(libs.plugins.vanniktech.mavenPublish) // publishing; presumably reads the POM_* values from gradle.properties — confirm
+}
+
+kotlin {
+    // Explicit API mode: public declarations must spell out visibility and return types.
+    explicitApi()
+
+    // Android target, compiled to JVM 11 bytecode.
+    androidTarget {
+        @OptIn(ExperimentalKotlinGradlePluginApi::class)
+        compilerOptions {
+            jvmTarget.set(JvmTarget.JVM_11)
+        }
+    }
+
+    // Kotlin/Native targets.
+    iosArm64()
+    iosSimulatorArm64()
+    macosArm64()
+    linuxX64()
+    linuxArm64()
+
+    // Plain JVM target.
+    jvm()
+
+    // Kotlin/Wasm target running in the browser.
+    @OptIn(ExperimentalWasmDsl::class)
+    wasmJs {
+        browser()
+        // NOTE(review): this module is published as a library; confirm that an
+        // executable Wasm binary is really wanted here.
+        binaries.executable()
+    }
+
+    sourceSets {
+        // Shared code only needs the tensor API module.
+        commonMain.dependencies {
+            implementation(project(":skainet-core:skainet-tensors-api"))
+        }
+
+        commonTest.dependencies {
+            implementation(libs.kotlin.test)
+        }
+    }
+}
+
+android { // Android library configuration for this module
+    namespace = "sk.ai.net.core.performance" // NOTE(review): the Kotlin sources use package `sk.ainet.core.performance` — confirm the `sk.ai.net` spelling is intended
+    compileSdk = libs.versions.android.compileSdk.get().toInt() // SDK level read from the `libs` catalog
+
+    defaultConfig {
+        minSdk = libs.versions.android.minSdk.get().toInt() // minimum SDK level read from the `libs` catalog
+    }
+    compileOptions { // Java 11, the same level as JvmTarget.JVM_11 set on androidTarget above
+        sourceCompatibility = JavaVersion.VERSION_11
+        targetCompatibility = JavaVersion.VERSION_11
+    }
+}
diff --git a/skainet-core/skainet-performance/gradle.properties b/skainet-core/skainet-performance/gradle.properties
@@ -0,0 +1,3 @@
+POM_ARTIFACT_ID=skainet-performance
+POM_NAME=SKaiNET Performance Measurement Framework
+POM_DESCRIPTION=Core performance measurement and benchmarking utilities for SKaiNET tensor operations
diff --git a/skainet-core/skainet-performance/src/commonMain/kotlin/sk/ainet/core/performance/BenchmarkResult.kt b/skainet-core/skainet-performance/src/commonMain/kotlin/sk/ainet/core/performance/BenchmarkResult.kt
@@ -0,0 +1,182 @@
+package sk.ainet.core.performance
+
+/**
+ * Result of benchmarking a single named operation.
+ *
+ * @property name label of the benchmarked operation; printed as the heading by [prettyPrint]
+ * @property executionTime execution-time statistics, expressed in microseconds
+ * @property memoryUsage memory statistics recorded for the run
+ * @property throughput operations per second
+ * @property metadata additional key/value information attached to the result
+ */
+public data class BenchmarkResult(
+    val name: String,
+    val executionTime: TimeStatistics,
+    val memoryUsage: MemoryStatistics,
+    val throughput: Double, // operations per second
+    val metadata: Map<String, Any>
+) {
+    /**
+     * Renders this result as a multi-line, human-readable block.
+     *
+     * Times are converted from microseconds to milliseconds for display.
+     * The returned text ends with a line break.
+     */
+    public fun prettyPrint(): String {
+        return buildString {
+            appendLine("$name:")
+            appendLine("  Time: ${(executionTime.mean / 1000).format(3)}ms ± ${(executionTime.standardDeviation / 1000).format(3)}ms")
+            appendLine("  Throughput: ${throughput.format(1)} ops/sec")
+            appendLine("  Memory: ${formatBytes(memoryUsage.allocatedBytes)}")
+            appendLine("  Range: ${(executionTime.min / 1000).format(3)}ms - ${(executionTime.max / 1000).format(3)}ms")
+        }
+    }
+
+    /**
+     * Formats a byte count using decimal units (1 KB = 1 000 B, 1 MB = 1 000 000 B).
+     * Values below 1 000 (including negative ones) are printed as plain bytes.
+     */
+    private fun formatBytes(bytes: Long): String {
+        return when {
+            bytes >= 1_000_000 -> "${(bytes / 1_000_000.0).format(1)}MB"
+            bytes >= 1_000 -> "${(bytes / 1_000.0).format(1)}KB"
+            else -> "${bytes}B"
+        }
+    }
+
+    /**
+     * Rounds the receiver to [decimals] decimal places and returns its string form.
+     *
+     * Only 0, 1 and 2 are honoured individually; any other value uses three decimals.
+     */
+    private fun Double.format(decimals: Int): String {
+        val scale = when (decimals) {
+            0 -> 1.0
+            1 -> 10.0
+            2 -> 100.0
+            else -> 1000.0
+        }
+        // Stay in floating point: Double.toInt() saturates at Int.MAX_VALUE, which
+        // corrupted large values (e.g. throughputs above ~2e8 ops/sec), truncated
+        // instead of rounding, and turned NaN into 0.
+        return (kotlin.math.round(this * scale) / scale).toString()
+    }
+}
+
+/**
+ * Statistical analysis of execution times.
+ *
+ * Every value is expressed in microseconds.
+ *
+ * @property mean mean execution time
+ * @property median median execution time
+ * @property standardDeviation standard deviation of the execution times
+ * @property min shortest execution time
+ * @property max longest execution time
+ * @property percentile95 95th-percentile execution time
+ */
+public data class TimeStatistics(
+    val mean: Double, // microseconds
+    val median: Double, // microseconds
+    val standardDeviation: Double, // microseconds
+    val min: Double, // microseconds
+    val max: Double, // microseconds
+    val percentile95: Double // microseconds
+)
+
+/**
+ * Memory usage statistics (placeholder for multiplatform compatibility).
+ *
+ * @property allocatedBytes allocated memory in bytes
+ * @property peakHeapUsage peak heap usage; presumably in bytes — TODO confirm
+ * @property gcCollections number of garbage collections
+ * @property gcTime garbage-collection time in milliseconds
+ */
+public data class MemoryStatistics(
+    val allocatedBytes: Long,
+    val peakHeapUsage: Long,
+    val gcCollections: Int,
+    val gcTime: Long // milliseconds
+)
+
+/**
+ * Benchmark report for one backend, holding the results of every operation category.
+ *
+ * @property backendName name of the backend the results belong to
+ * @property matrixMultiplication matrix-multiplication results
+ * @property elementwiseOperations element-wise results, grouped by operation type
+ * @property dotProduct dot-product results
+ * @property scalarOperations scalar-operation results, grouped by operation type
+ * @property summary aggregate figures for the whole run
+ */
+public data class BenchmarkReport(
+    val backendName: String,
+    val matrixMultiplication: List<BenchmarkResult>,
+    val elementwiseOperations: Map<String, List<BenchmarkResult>>,
+    val dotProduct: List<BenchmarkResult>,
+    val scalarOperations: Map<String, List<BenchmarkResult>>,
+    val summary: BenchmarkSummary
+) {
+    /**
+     * Renders the complete report as human-readable text.
+     *
+     * All four result categories are printed, followed by the summary.
+     * Previously the dot-product and scalar-operation results were silently omitted.
+     */
+    public fun prettyPrint(): String {
+        return buildString {
+            val rule = "=".repeat(50)
+            appendLine(rule)
+            appendLine("TENSOR BENCHMARK REPORT - $backendName")
+            appendLine(rule)
+            appendLine()
+
+            appendLine("MATRIX MULTIPLICATION:")
+            matrixMultiplication.forEach { result ->
+                appendLine(result.prettyPrint())
+            }
+            appendLine()
+
+            appendLine("ELEMENT-WISE OPERATIONS:")
+            appendGroupedResults(elementwiseOperations)
+            appendLine()
+
+            appendLine("DOT PRODUCT:")
+            dotProduct.forEach { result ->
+                appendLine(result.prettyPrint())
+            }
+            appendLine()
+
+            appendLine("SCALAR OPERATIONS:")
+            appendGroupedResults(scalarOperations)
+            appendLine()
+
+            appendLine("SUMMARY:")
+            appendLine("  Total Operations: ${summary.totalOperations}")
+            appendLine("  Average Throughput: ${summary.averageThroughput.format(1)} ops/sec")
+            appendLine("  Fastest: ${summary.fastestOperation}")
+            appendLine("  Slowest: ${summary.slowestOperation}")
+        }
+    }
+
+    /**
+     * Appends each group as an indented heading followed by its results.
+     *
+     * Every result block is indented uniformly so its detail lines stay nested
+     * under its name. The old code indented the name line deeper than the details
+     * and left a whitespace-only line after each block.
+     */
+    private fun StringBuilder.appendGroupedResults(groups: Map<String, List<BenchmarkResult>>) {
+        groups.forEach { (opType, results) ->
+            appendLine("  $opType:")
+            results.forEach { result ->
+                // trimEnd() drops the trailing line break so no blank, indent-only line is produced.
+                appendLine(result.prettyPrint().trimEnd().prependIndent("    "))
+            }
+        }
+    }
+
+    /**
+     * Rounds the receiver to [decimals] decimal places and returns its string form.
+     *
+     * Only 0, 1 and 2 are honoured individually; any other value uses three decimals.
+     */
+    private fun Double.format(decimals: Int): String {
+        val scale = when (decimals) {
+            0 -> 1.0
+            1 -> 10.0
+            2 -> 100.0
+            else -> 1000.0
+        }
+        // Stay in floating point: Double.toInt() saturates at Int.MAX_VALUE, which
+        // corrupted large throughputs, truncated instead of rounding, and mapped NaN to 0.
+        return (kotlin.math.round(this * scale) / scale).toString()
+    }
+}
+
+/**
+ * Summary statistics for a benchmark run.
+ *
+ * @property totalOperations total number of operations in the run
+ * @property averageThroughput average throughput; reported as ops/sec by BenchmarkReport.prettyPrint
+ * @property fastestOperation text identifying the fastest operation (presumably its name — confirm)
+ * @property slowestOperation text identifying the slowest operation (presumably its name — confirm)
+ */
+public data class BenchmarkSummary(
+    val totalOperations: Int,
+    val averageThroughput: Double,
+    val fastestOperation: String,
+    val slowestOperation: String
+)
+
+/**
+ * Backend comparison report showing speedup analysis.
+ *
+ * @property baselineBackend name of the baseline backend
+ * @property baselineResults benchmark report of the baseline backend
+ * @property comparisonBackend name of the backend compared against the baseline
+ * @property comparisonResults benchmark report of the compared backend
+ * @property speedupAnalysis speedup figures derived from the two reports
+ */
+public data class ComparisonReport(
+    val baselineBackend: String,
+    val baselineResults: BenchmarkReport,
+    val comparisonBackend: String,
+    val comparisonResults: BenchmarkReport,
+    val speedupAnalysis: SpeedupAnalysis
+) {
+    /**
+     * Renders the comparison as human-readable text: aggregate speedups, then the
+     * per-operation speedups, then the per-tensor-size speedups when there are any.
+     */
+    public fun prettyPrint(): String {
+        return buildString {
+            val rule = "=".repeat(60)
+            appendLine(rule)
+            appendLine("BACKEND COMPARISON: $baselineBackend vs $comparisonBackend")
+            appendLine(rule)
+            appendLine()
+
+            appendLine("SPEEDUP ANALYSIS:")
+            appendLine("  Average Speedup: ${speedupAnalysis.averageSpeedup.format(2)}x")
+            appendLine("  Best Case: ${speedupAnalysis.bestCaseSpeedup.format(2)}x")
+            appendLine("  Worst Case: ${speedupAnalysis.worstCaseSpeedup.format(2)}x")
+            appendLine()
+
+            appendLine("DETAILED SPEEDUPS:")
+            speedupAnalysis.operationSpeedups.forEach { (operation, speedup) ->
+                appendLine("  $operation: ${speedup.format(2)}x")
+            }
+
+            // Previously this map was carried by the report but never shown. It is only
+            // printed when non-empty, so output for reports without it is unchanged.
+            if (speedupAnalysis.speedupByTensorSize.isNotEmpty()) {
+                appendLine()
+                appendLine("SPEEDUP BY TENSOR SIZE:")
+                speedupAnalysis.speedupByTensorSize.forEach { (size, speedup) ->
+                    appendLine("  $size: ${speedup.format(2)}x")
+                }
+            }
+        }
+    }
+
+    /**
+     * Rounds the receiver to [decimals] decimal places and returns its string form.
+     *
+     * Only 0, 1 and 2 are honoured individually; any other value uses three decimals.
+     */
+    private fun Double.format(decimals: Int): String {
+        val scale = when (decimals) {
+            0 -> 1.0
+            1 -> 10.0
+            2 -> 100.0
+            else -> 1000.0
+        }
+        // Stay in floating point: Double.toInt() saturates at Int.MAX_VALUE,
+        // truncates instead of rounding, and maps NaN to 0.
+        return (kotlin.math.round(this * scale) / scale).toString()
+    }
+}
+
+/**
+ * Speedup analysis comparing two backends.
+ *
+ * @property operationSpeedups speedup factor per operation, keyed by operation label
+ * @property averageSpeedup average speedup factor
+ * @property bestCaseSpeedup best-case speedup factor
+ * @property worstCaseSpeedup worst-case speedup factor
+ * @property speedupByTensorSize speedup factor per tensor size; key format is not visible here — presumably a size label, confirm against the producer
+ */
+public data class SpeedupAnalysis(
+    val operationSpeedups: Map<String, Double>,
+    val averageSpeedup: Double,
+    val bestCaseSpeedup: Double,
+    val worstCaseSpeedup: Double,
+    val speedupByTensorSize: Map<String, Double>
+)
diff --git a/skainet-core/skainet-performance/src/commonMain/kotlin/sk/ainet/core/performance/BenchmarkRunner.kt b/skainet-core/skainet-performance/src/commonMain/kotlin/sk/ainet/core/performance/BenchmarkRunner.kt

Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,3 @@`
	`1`	`+POM_ARTIFACT_ID=skainet-performance`
	`2`	`+POM_NAME=SKaiNET Performance Measurement Framework`
	`3`	`+POM_DESCRIPTION=Core performance measurement and benchmarking utilities for SKaiNET tensor operations`