diff options
| author | Marc Tiehuis <marc@tiehu.is> | 2019-08-21 20:46:15 +1200 |
|---|---|---|
| committer | Marc Tiehuis <marc@tiehu.is> | 2019-08-21 20:46:15 +1200 |
| commit | 48410943cbcbf53ae3c9895b2452218d6eacbc4b (patch) | |
| tree | 7bc17655da80359c234584ed45289471cb727194 | |
| parent | c050ec4e570caf53be924bcbbe4194512b6a022c (diff) | |
| download | zig-48410943cbcbf53ae3c9895b2452218d6eacbc4b.tar.gz zig-48410943cbcbf53ae3c9895b2452218d6eacbc4b.zip | |
Add more hash functions to benchmark scripts
Changed CRC api so the polynomial is specified as an enum for simpler
construction.
| -rw-r--r-- | std/hash/benchmark.zig | 90 | ||||
| -rw-r--r-- | std/hash/crc.zig | 26 |
2 files changed, 86 insertions, 30 deletions
diff --git a/std/hash/benchmark.zig b/std/hash/benchmark.zig index b42a34ef31..ca948d21bf 100644 --- a/std/hash/benchmark.zig +++ b/std/hash/benchmark.zig @@ -15,6 +15,7 @@ var prng = std.rand.DefaultPrng.init(0); const Hash = struct { ty: type, name: []const u8, + has_iterative_api: bool = true, init_u8s: ?[]const u8 = null, init_u64: ?u64 = null, }; @@ -22,11 +23,62 @@ const Hash = struct { const siphash_key = "0123456789abcdef"; const hashes = [_]Hash{ - Hash{ .ty = hash.Wyhash, .name = "wyhash", .init_u64 = 0 }, - Hash{ .ty = hash.SipHash64(1, 3), .name = "siphash(1,3)", .init_u8s = siphash_key }, - Hash{ .ty = hash.SipHash64(2, 4), .name = "siphash(2,4)", .init_u8s = siphash_key }, - Hash{ .ty = hash.Fnv1a_64, .name = "fnv1a" }, - Hash{ .ty = hash.Crc32, .name = "crc32" }, + Hash{ + .ty = hash.Wyhash, + .name = "wyhash", + .init_u64 = 0, + }, + Hash{ + .ty = hash.SipHash64(1, 3), + .name = "siphash(1,3)", + .init_u8s = siphash_key, + }, + Hash{ + .ty = hash.SipHash64(2, 4), + .name = "siphash(2,4)", + .init_u8s = siphash_key, + }, + Hash{ + .ty = hash.Fnv1a_64, + .name = "fnv1a", + }, + Hash{ + .ty = hash.Adler32, + .name = "adler32", + }, + Hash{ + .ty = hash.crc.Crc32WithPoly(.IEEE), + .name = "crc32-slicing-by-8", + }, + Hash{ + .ty = hash.crc.Crc32SmallWithPoly(.IEEE), + .name = "crc32-half-byte-lookup", + }, + Hash{ + .ty = hash.CityHash32, + .name = "cityhash-32", + .has_iterative_api = false, + }, + Hash{ + .ty = hash.CityHash64, + .name = "cityhash-64", + .has_iterative_api = false, + }, + Hash{ + .ty = hash.Murmur2_32, + .name = "murmur2-32", + .has_iterative_api = false, + }, + Hash{ + .ty = hash.Murmur2_64, + .name = "murmur2-64", + .has_iterative_api = false, + }, + Hash{ + .ty = hash.Murmur3_32, + .name = "murmur3-32", + .has_iterative_api = false, + }, }; const Result = struct { @@ -78,10 +130,8 @@ pub fn benchmarkHashSmallKeys(comptime H: var, key_size: usize, bytes: usize) !R var sum: u64 = 0; while (i < key_count) : (i += 1) { - const o = i % (block_size - key_size); - const small_key = block[o .. key_size + o]; - - const result = blk: { + const small_key = block[0..key_size]; + sum +%= blk: { if (H.init_u8s) |init| { break :blk H.ty.hash(init, small_key); } @@ -90,8 +140,6 @@ pub fn benchmarkHashSmallKeys(comptime H: var, key_size: usize, bytes: usize) !R } break :blk H.ty.hash(small_key); }; - - sum +%= result; } const end = timer.read(); @@ -142,6 +190,7 @@ pub fn main() !void { var filter: ?[]u8 = ""; var count: usize = mode(128 * MiB); var key_size: usize = 32; + var seed: u32 = 0; var i: usize = 1; while (i < args.len) : (i += 1) { @@ -155,8 +204,8 @@ pub fn main() !void { std.os.exit(1); } - const seed = try std.fmt.parseUnsigned(u32, args[i], 10); - prng.seed(seed); + seed = try std.fmt.parseUnsigned(u32, args[i], 10); + // we seed later } else if (std.mem.eql(u8, args[i], "--filter")) { i += 1; if (i == args.len) { @@ -197,11 +246,18 @@ pub fn main() !void { inline for (hashes) |H| { if (filter == null or std.mem.indexOf(u8, H.name, filter.?) != null) { - const result = try benchmarkHash(H, count); - const result_small = try benchmarkHashSmallKeys(H, key_size, count); - try stdout.print("{}\n", H.name); - try stdout.print(" iterative: {:4} MiB/s [{x:0<16}]\n", result.throughput / (1 * MiB), result.hash); + + // Always reseed prior to every call so we are hashing the same buffer contents. + // This allows easier comparison between different implementations. + if (H.has_iterative_api) { + prng.seed(seed); + const result = try benchmarkHash(H, count); + try stdout.print(" iterative: {:4} MiB/s [{x:0<16}]\n", result.throughput / (1 * MiB), result.hash); + } + + prng.seed(seed); + const result_small = try benchmarkHashSmallKeys(H, key_size, count); try stdout.print(" small keys: {:4} MiB/s [{x:0<16}]\n", result_small.throughput / (1 * MiB), result_small.hash); } } diff --git a/std/hash/crc.zig b/std/hash/crc.zig index 53b4262c93..73e5bb0371 100644 --- a/std/hash/crc.zig +++ b/std/hash/crc.zig @@ -9,17 +9,17 @@ const std = @import("../std.zig"); const debug = std.debug; const testing = std.testing; -pub const Polynomial = struct { - const IEEE = 0xedb88320; - const Castagnoli = 0x82f63b78; - const Koopman = 0xeb31d82e; +pub const Polynomial = enum(u32) { + IEEE = 0xedb88320, + Castagnoli = 0x82f63b78, + Koopman = 0xeb31d82e, }; // IEEE is by far the most common CRC and so is aliased by default. -pub const Crc32 = Crc32WithPoly(Polynomial.IEEE); +pub const Crc32 = Crc32WithPoly(.IEEE); // slicing-by-8 crc32 implementation. -pub fn Crc32WithPoly(comptime poly: u32) type { +pub fn Crc32WithPoly(comptime poly: Polynomial) type { return struct { const Self = @This(); const lookup_tables = comptime block: { @@ -31,7 +31,7 @@ pub fn Crc32WithPoly(comptime poly: u32) type { var j: usize = 0; while (j < 8) : (j += 1) { if (crc & 1 == 1) { - crc = (crc >> 1) ^ poly; + crc = (crc >> 1) ^ @enumToInt(poly); } else { crc = (crc >> 1); } @@ -100,7 +100,7 @@ pub fn Crc32WithPoly(comptime poly: u32) type { } test "crc32 ieee" { - const Crc32Ieee = Crc32WithPoly(Polynomial.IEEE); + const Crc32Ieee = Crc32WithPoly(.IEEE); testing.expect(Crc32Ieee.hash("") == 0x00000000); testing.expect(Crc32Ieee.hash("a") == 0xe8b7be43); @@ -108,7 +108,7 @@ test "crc32 ieee" { } test "crc32 castagnoli" { - const Crc32Castagnoli = Crc32WithPoly(Polynomial.Castagnoli); + const Crc32Castagnoli = Crc32WithPoly(.Castagnoli); testing.expect(Crc32Castagnoli.hash("") == 0x00000000); testing.expect(Crc32Castagnoli.hash("a") == 0xc1d04330); @@ -116,7 +116,7 @@ test "crc32 castagnoli" { } // half-byte lookup table implementation. -pub fn Crc32SmallWithPoly(comptime poly: u32) type { +pub fn Crc32SmallWithPoly(comptime poly: Polynomial) type { return struct { const Self = @This(); const lookup_table = comptime block: { @@ -127,7 +127,7 @@ pub fn Crc32SmallWithPoly(comptime poly: u32) type { var j: usize = 0; while (j < 8) : (j += 1) { if (crc & 1 == 1) { - crc = (crc >> 1) ^ poly; + crc = (crc >> 1) ^ @enumToInt(poly); } else { crc = (crc >> 1); } @@ -164,7 +164,7 @@ pub fn Crc32SmallWithPoly(comptime poly: u32) type { } test "small crc32 ieee" { - const Crc32Ieee = Crc32SmallWithPoly(Polynomial.IEEE); + const Crc32Ieee = Crc32SmallWithPoly(.IEEE); testing.expect(Crc32Ieee.hash("") == 0x00000000); testing.expect(Crc32Ieee.hash("a") == 0xe8b7be43); @@ -172,7 +172,7 @@ test "small crc32 ieee" { } test "small crc32 castagnoli" { - const Crc32Castagnoli = Crc32SmallWithPoly(Polynomial.Castagnoli); + const Crc32Castagnoli = Crc32SmallWithPoly(.Castagnoli); testing.expect(Crc32Castagnoli.hash("") == 0x00000000); testing.expect(Crc32Castagnoli.hash("a") == 0xc1d04330); |
