|
package datadog.trace.util;

import java.util.HashMap;
import java.util.Locale;
import java.util.TreeMap;
import java.util.concurrent.ThreadLocalRandom;
import java.util.function.Supplier;

import org.openjdk.jmh.annotations.Benchmark;
import org.openjdk.jmh.annotations.Fork;
import org.openjdk.jmh.annotations.Measurement;
import org.openjdk.jmh.annotations.Threads;
import org.openjdk.jmh.annotations.Warmup;
import org.openjdk.jmh.infra.Blackhole;

| 15 | +/** |
| 16 | + * <ul>Benchmark to illustrate the trade-offs around case-insensitive Map look-ups - using either... |
| 17 | + * <li>(RECOMMENDED) TreeMap with Comparator of String::compareToIgnoreCase |
| 18 | + * <li>HashMap with look-ups using String::to<X>Case |
| 19 | + * </ul> |
| 20 | + * |
| 21 | + * <p>For case-insensitive lookups, TreeMap map creation is consistently faster because it |
| 22 | + * avoids String::to<X>Case calls. |
| 23 | + * |
| 24 | + * <p>Despite calls to String::to<X>Case, HashMap lookups are faster in single threaded |
| 25 | + * microbenchmark by 50% but are worse when frequently called in a multi-threaded system. |
| 26 | + * |
| 27 | + * <p>With many threads, the extra allocation from calling String::to<X>Case leads to frequent GCs |
| 28 | + * which has adverse impacts on the whole system. |
| 29 | + * |
| 30 | + * <code> |
| 31 | + * MacBook M1 with 1 thread (Java 21) |
| 32 | + * |
| 33 | + * Benchmark Mode Cnt Score Error Units |
| 34 | + * CaseInsensitiveMapBenchmark.create_hashMap thrpt 6 994213.041 ± 15718.903 ops/s |
| 35 | + * CaseInsensitiveMapBenchmark.create_treeMap thrpt 6 1522900.015 ± 21646.688 ops/s |
| 36 | + * |
| 37 | + * CaseInsensitiveMapBenchmark.get_hashMap thrpt 6 69149862.293 ± 9168648.566 ops/s |
| 38 | + * CaseInsensitiveMapBenchmark.get_treeMap thrpt 6 42796699.230 ± 9029447.805 ops/s |
| 39 | + * </code> |
| 40 | + * |
| 41 | + * <code> |
| 42 | + * MacBook M1 with 8 threads (Java 21) |
| 43 | + * |
| 44 | + * Benchmark Mode Cnt Score Error Units |
| 45 | + * CaseInsensitiveMapBenchmark.create_hashMap thrpt 6 6641003.483 ± 543210.409 ops/s |
| 46 | + * CaseInsensitiveMapBenchmark.create_treeMap thrpt 6 10030191.764 ± 1308865.113 ops/s |
| 47 | + * |
| 48 | + * CaseInsensitiveMapBenchmark.get_hashMap thrpt 6 38748031.837 ± 9012072.804 ops/s |
| 49 | + * CaseInsensitiveMapBenchmark.get_treeMap thrpt 6 173495470.789 ± 27824904.999 ops/s |
| 50 | + * </code> |
| 51 | + */ |
| 52 | +@Fork(2) |
| 53 | +@Warmup(iterations=2) |
| 54 | +@Measurement(iterations=3) |
| 55 | +@Threads(8) |
| 56 | +public class CaseInsensitiveMapBenchmark { |
| 57 | + static final String[] PREFIXES = { |
| 58 | + "foo", |
| 59 | + "bar", |
| 60 | + "baz", |
| 61 | + "quux" |
| 62 | + }; |
| 63 | + |
| 64 | + static final int NUM_SUFFIXES = 4; |
| 65 | + |
| 66 | + static <T> T init(Supplier<T> supplier) { |
| 67 | + return supplier.get(); |
| 68 | + } |
| 69 | + |
| 70 | + static final String[] UPPER_PREFIXES = init(() -> { |
| 71 | + String[] upperPrefixes = new String[PREFIXES.length]; |
| 72 | + for ( int i = 0; i < PREFIXES.length; ++i ) { |
| 73 | + upperPrefixes[i] = PREFIXES[i].toUpperCase(); |
| 74 | + } |
| 75 | + return upperPrefixes; |
| 76 | + }); |
| 77 | + |
| 78 | + static final String[] LOOKUP_KEYS = init(() -> { |
| 79 | + ThreadLocalRandom curRandom = ThreadLocalRandom.current(); |
| 80 | + |
| 81 | + String[] keys = new String[32]; |
| 82 | + for ( int i = 0; i < keys.length; ++i ) { |
| 83 | + int prefixIndex = curRandom.nextInt(PREFIXES.length); |
| 84 | + boolean toUpper = curRandom.nextBoolean(); |
| 85 | + int suffixIndex = curRandom.nextInt(NUM_SUFFIXES + 1); |
| 86 | + |
| 87 | + String key = PREFIXES[prefixIndex] + "-" + suffixIndex; |
| 88 | + keys[i] = toUpper ? key.toUpperCase() : key.toLowerCase(); |
| 89 | + } |
| 90 | + return keys; |
| 91 | + }); |
| 92 | + |
| 93 | + static int sharedLookupIndex = 0; |
| 94 | + |
| 95 | + static String nextLookupKey() { |
| 96 | + int localIndex = ++sharedLookupIndex; |
| 97 | + if ( localIndex >= LOOKUP_KEYS.length ) { |
| 98 | + sharedLookupIndex = localIndex = 0; |
| 99 | + } |
| 100 | + return LOOKUP_KEYS[localIndex]; |
| 101 | + } |
| 102 | + |
| 103 | + @Benchmark |
| 104 | + public void create_baseline(Blackhole blackhole) { |
| 105 | + for ( int suffix = 0; suffix < NUM_SUFFIXES; ++suffix ) { |
| 106 | + for ( String prefix: PREFIXES ) { |
| 107 | + blackhole.consume(prefix + "-" + suffix); |
| 108 | + blackhole.consume(Integer.valueOf(suffix)); |
| 109 | + } |
| 110 | + } |
| 111 | + for ( int suffix = 0; suffix < NUM_SUFFIXES; suffix +=2 ) { |
| 112 | + for ( String prefix: UPPER_PREFIXES ) { |
| 113 | + blackhole.consume(prefix + "-" + suffix); |
| 114 | + blackhole.consume(Integer.valueOf(suffix + 1)); |
| 115 | + } |
| 116 | + } |
| 117 | + } |
| 118 | + |
| 119 | + @Benchmark |
| 120 | + public void lookup_baseline(Blackhole blackhole) { |
| 121 | + blackhole.consume(nextLookupKey()); |
| 122 | + } |
| 123 | + |
| 124 | + @Benchmark |
| 125 | + public HashMap<String, Integer> create_hashMap() { |
| 126 | + return _create_hashMap(); |
| 127 | + } |
| 128 | + |
| 129 | + static HashMap<String, Integer> _create_hashMap() { |
| 130 | + HashMap<String, Integer> map = new HashMap<>(); |
| 131 | + for ( int suffix = 0; suffix < NUM_SUFFIXES; ++suffix ) { |
| 132 | + for ( String prefix: PREFIXES ) { |
| 133 | + map.put((prefix + "-" + suffix).toLowerCase(), suffix); // arguable, but real caller probably doesn't know the case ahead-of-time |
| 134 | + } |
| 135 | + } |
| 136 | + for ( int suffix = 0; suffix < NUM_SUFFIXES; suffix +=2 ) { |
| 137 | + for ( String prefix: UPPER_PREFIXES ) { |
| 138 | + map.put((prefix + "-" + suffix).toLowerCase(), suffix + 1); |
| 139 | + } |
| 140 | + } |
| 141 | + return map; |
| 142 | + } |
| 143 | + |
| 144 | + static final HashMap<String, Integer> HASH_MAP = _create_hashMap(); |
| 145 | + |
| 146 | + @Benchmark |
| 147 | + public Integer lookup_hashMap() { |
| 148 | + // This benchmark is still "correct" in multi-threaded context, |
| 149 | + // Map is populated under the class initialization lock and not changed thereafter |
| 150 | + return HASH_MAP.get(nextLookupKey().toLowerCase()); |
| 151 | + } |
| 152 | + |
| 153 | + @Benchmark |
| 154 | + public TreeMap<String, Integer> create_treeMap() { |
| 155 | + return _create_treeMap(); |
| 156 | + } |
| 157 | + |
| 158 | + static TreeMap<String, Integer> _create_treeMap() { |
| 159 | + TreeMap<String, Integer> map = new TreeMap<>(String::compareToIgnoreCase); |
| 160 | + for ( int suffix = 0; suffix < NUM_SUFFIXES; ++suffix ) { |
| 161 | + for ( String prefix: PREFIXES ) { |
| 162 | + map.put(prefix + "-" + suffix, suffix); |
| 163 | + } |
| 164 | + } |
| 165 | + for ( int suffix = 0; suffix < NUM_SUFFIXES; suffix +=2 ) { |
| 166 | + for ( String prefix: UPPER_PREFIXES ) { |
| 167 | + map.put(prefix + "-" + suffix, suffix + 1); |
| 168 | + } |
| 169 | + } |
| 170 | + return map; |
| 171 | + } |
| 172 | + |
| 173 | + static final TreeMap<String, Integer> TREE_MAP = _create_treeMap(); |
| 174 | + |
| 175 | + @Benchmark |
| 176 | + public Integer lookup_treeMap() { |
| 177 | + // This benchmark is still "correct" in multi-threaded context, |
| 178 | + // Map is populated under the initial class initialization lock and not changed thereafter |
| 179 | + return TREE_MAP.get(nextLookupKey()); |
| 180 | + } |
| 181 | + |
| 182 | + // TODO: Add ConcurrentSkipListMap & synchronized HashMap & TreeMap |
| 183 | +} |
0 commit comments