diff --git a/docs/benchmarks/tokenizer/10000_lines.svg b/docs/benchmarks/tokenizer/10000_lines.svg
new file mode 100644
index 000000000..7c2b11558
--- /dev/null
+++ b/docs/benchmarks/tokenizer/10000_lines.svg
@@ -0,0 +1,610 @@
+
+
diff --git a/docs/benchmarks/tokenizer/10000_lines.txt b/docs/benchmarks/tokenizer/10000_lines.txt
new file mode 100644
index 000000000..87e2665b9
--- /dev/null
+++ b/docs/benchmarks/tokenizer/10000_lines.txt
@@ -0,0 +1,9 @@
+------------------------------------------------------------------------------------------- benchmark: 5 tests -------------------------------------------------------------------------------------------
+Name (time in ms) Min Max Mean StdDev Median IQR Outliers OPS Rounds Iterations
+----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
+test_json_file_10000_lines 35.1458 (1.0) 42.3855 (1.10) 35.9227 (1.0) 1.6084 (2.81) 35.3149 (1.0) 0.6377 (4.43) 2;2 27.8375 (1.0) 28 1
+test_yaml_file_10000_lines 36.3607 (1.03) 38.5070 (1.0) 36.7285 (1.02) 0.5724 (1.0) 36.5422 (1.03) 0.1438 (1.0) 3;3 27.2268 (0.98) 26 1
+test_javascript_source_10000_lines 42.4648 (1.21) 57.9463 (1.50) 44.3093 (1.23) 3.8546 (6.73) 42.6463 (1.21) 1.0546 (7.33) 3;4 22.5686 (0.81) 22 1
+test_python_source_10000_lines 45.1904 (1.29) 49.2031 (1.28) 45.8314 (1.28) 1.1117 (1.94) 45.3827 (1.29) 0.2863 (1.99) 2;4 21.8191 (0.78) 22 1
+test_xml_file_10000_lines 150.8377 (4.29) 154.2563 (4.01) 151.8601 (4.23) 1.3659 (2.39) 151.4022 (4.29) 1.0826 (7.53) 1;1 6.5850 (0.24) 5 1
+----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
diff --git a/docs/benchmarks/tokenizer/1000_lines.svg b/docs/benchmarks/tokenizer/1000_lines.svg
new file mode 100644
index 000000000..557e0f1db
--- /dev/null
+++ b/docs/benchmarks/tokenizer/1000_lines.svg
@@ -0,0 +1,665 @@
+
+
diff --git a/docs/benchmarks/tokenizer/1000_lines.txt b/docs/benchmarks/tokenizer/1000_lines.txt
new file mode 100644
index 000000000..53e8fdbe3
--- /dev/null
+++ b/docs/benchmarks/tokenizer/1000_lines.txt
@@ -0,0 +1,10 @@
+----------------------------------------------------------------------------------------- benchmark: 6 tests -----------------------------------------------------------------------------------------
+Name (time in ms) Min Max Mean StdDev Median IQR Outliers OPS Rounds Iterations
+------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
+test_json_file_1000_lines 3.4195 (1.0) 4.2138 (1.01) 3.4932 (1.00) 0.1289 (1.53) 3.4506 (1.0) 0.0370 (1.14) 20;27 286.2730 (1.00) 247 1
+test_yaml_file_1000_lines 3.4353 (1.00) 4.1749 (1.0) 3.4841 (1.0) 0.0841 (1.0) 3.4651 (1.00) 0.0325 (1.0) 10;16 287.0144 (1.0) 273 1
+test_python_source_1000_lines 3.5137 (1.03) 4.3616 (1.04) 3.6713 (1.05) 0.2171 (2.58) 3.5603 (1.03) 0.1787 (5.49) 42;33 272.3858 (0.95) 250 1
+test_javascript_source_1000_lines 3.8670 (1.13) 4.8750 (1.17) 4.0406 (1.16) 0.2360 (2.80) 3.9243 (1.14) 0.1752 (5.39) 35;31 247.4853 (0.86) 208 1
+test_xml_file_1000_lines 14.5713 (4.26) 18.0922 (4.33) 14.7514 (4.23) 0.4419 (5.25) 14.6636 (4.25) 0.0985 (3.03) 2;8 67.7901 (0.24) 67 1
+test_lorem_ipsum_times_1000_times 40.9866 (11.99) 41.9590 (10.05) 41.6153 (11.94) 0.4594 (5.46) 41.8791 (12.14) 0.8625 (26.52) 2;0 24.0296 (0.08) 6 1
+------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
diff --git a/docs/benchmarks/tokenizer/100_lines.svg b/docs/benchmarks/tokenizer/100_lines.svg
new file mode 100644
index 000000000..6cc9b61f4
--- /dev/null
+++ b/docs/benchmarks/tokenizer/100_lines.svg
@@ -0,0 +1,660 @@
+
+
diff --git a/docs/benchmarks/tokenizer/100_lines.txt b/docs/benchmarks/tokenizer/100_lines.txt
new file mode 100644
index 000000000..d3c4c1945
--- /dev/null
+++ b/docs/benchmarks/tokenizer/100_lines.txt
@@ -0,0 +1,10 @@
+------------------------------------------------------------------------------------------------- benchmark: 6 tests ------------------------------------------------------------------------------------------------
+Name (time in us) Min Max Mean StdDev Median IQR Outliers OPS Rounds Iterations
+---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
+test_python_source_100_lines 242.5400 (1.0) 359.4250 (1.0) 255.1634 (1.0) 19.5716 (1.69) 247.1790 (1.0) 10.6970 (2.36) 263;281 3,919.0570 (1.0) 2380 1
+test_json_file_100_lines 380.9340 (1.57) 779.3030 (2.17) 389.2734 (1.53) 11.5771 (1.0) 387.2705 (1.57) 5.6260 (1.24) 176;213 2,568.8884 (0.66) 2094 1
+test_javascript_source_100_lines 381.1490 (1.57) 943.9490 (2.63) 389.5003 (1.53) 15.1875 (1.31) 387.4350 (1.57) 4.5335 (1.0) 100;160 2,567.3921 (0.66) 1815 1
+test_yaml_file_100_lines 398.1340 (1.64) 989.9450 (2.75) 405.5441 (1.59) 14.2924 (1.23) 404.0920 (1.63) 5.1420 (1.13) 81;143 2,465.8228 (0.63) 1966 1
+test_xml_file_100_lines 1,545.7790 (6.37) 1,859.1840 (5.17) 1,572.3290 (6.16) 22.9494 (1.98) 1,567.0090 (6.34) 14.5047 (3.20) 46;37 635.9992 (0.16) 539 1
+test_lorem_ipsum_times_100_times 4,061.0170 (16.74) 4,152.4630 (11.55) 4,093.7268 (16.04) 32.8167 (2.83) 4,087.8280 (16.54) 46.5311 (10.26) 2;0 244.2762 (0.06) 8 1
+---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
diff --git a/docs/benchmarks/tokenizer/10_lines.svg b/docs/benchmarks/tokenizer/10_lines.svg
new file mode 100644
index 000000000..b19336c1f
--- /dev/null
+++ b/docs/benchmarks/tokenizer/10_lines.svg
@@ -0,0 +1,620 @@
+
+
diff --git a/docs/benchmarks/tokenizer/10_lines.txt b/docs/benchmarks/tokenizer/10_lines.txt
new file mode 100644
index 000000000..431c0d664
--- /dev/null
+++ b/docs/benchmarks/tokenizer/10_lines.txt
@@ -0,0 +1,10 @@
+-------------------------------------------------------------------------------------------- benchmark: 6 tests --------------------------------------------------------------------------------------------
+Name (time in us) Min Max Mean StdDev Median IQR Outliers OPS (Kops/s) Rounds Iterations
+------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
+test_python_source_10_lines 22.8470 (1.0) 56.1720 (1.0) 23.6609 (1.0) 0.8214 (1.0) 23.4740 (1.0) 0.3405 (1.0) 1027;1437 42.2638 (1.0) 14104 1
+test_javascript_source_10_lines 42.5120 (1.86) 596.0850 (10.61) 43.7448 (1.85) 5.7926 (7.05) 43.4260 (1.85) 0.4999 (1.47) 15;860 22.8599 (0.54) 9397 1
+test_json_file_10_lines 43.7800 (1.92) 111.4280 (1.98) 45.6973 (1.93) 2.4697 (3.01) 45.0140 (1.92) 0.6990 (2.05) 874;1562 21.8831 (0.52) 11274 1
+test_yaml_file_10_lines 44.3640 (1.94) 66.0510 (1.18) 45.8708 (1.94) 1.2791 (1.56) 45.4090 (1.93) 0.7530 (2.21) 1667;1751 21.8004 (0.52) 10432 1
+test_xml_file_10_lines 116.3430 (5.09) 684.6800 (12.19) 124.4895 (5.26) 8.5224 (10.38) 123.6365 (5.27) 1.6230 (4.77) 20;529 8.0328 (0.19) 4610 1
+test_lorem_ipsum_times_10_times 412.0250 (18.03) 443.5790 (7.90) 421.8986 (17.83) 9.7967 (11.93) 421.4340 (17.95) 8.1905 (24.05) 2;1 2.3702 (0.06) 8 1
+------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
diff --git a/docs/benchmarks/tokenizer/all.svg b/docs/benchmarks/tokenizer/all.svg
index ed9880640..a437a492b 100644
--- a/docs/benchmarks/tokenizer/all.svg
+++ b/docs/benchmarks/tokenizer/all.svg
@@ -1,14 +1,14 @@
-