1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115
use std::mem; fn fmix32(mut h: u32) -> u32 { h ^= h >> 16; h = h.wrapping_mul(0x85ebca6b); h ^= h >> 13; h = h.wrapping_mul(0xc2b2ae35); h ^= h >> 16; return h; } fn get_32_block(bytes: &[u8], index: usize) -> u32 { let b32: &[u32] = unsafe { mem::transmute(bytes) }; return b32[index]; } pub fn murmurhash3_x86_32(bytes: &[u8], seed: u32) -> u32 { let c1 = 0xcc9e2d51u32; let c2 = 0x1b873593u32; let read_size = 4; let len = bytes.len() as u32; let block_count = len / read_size; let mut h1 = seed; for i in 0..block_count as usize { let mut k1 = get_32_block(bytes, i); k1 = k1.wrapping_mul(c1); k1 = k1.rotate_left(15); k1 = k1.wrapping_mul(c2); h1 ^= k1; h1 = h1.rotate_left(13); h1 = h1.wrapping_mul(5); h1 = h1.wrapping_add(0xe6546b64) } let mut k1 = 0u32; if len & 3 == 3 { k1 ^= (bytes[(block_count * read_size) as usize + 2] as u32) << 16; } if len & 3 >= 2 { k1 ^= (bytes[(block_count * read_size) as usize + 1] as u32) << 8; } if len & 3 >= 1 { k1 ^= bytes[(block_count * read_size) as usize + 0] as u32; k1 = k1.wrapping_mul(c1); k1 = k1.rotate_left(15); k1 = k1.wrapping_mul(c2); h1 ^= k1; } h1 ^= bytes.len() as u32; h1 = fmix32(h1); return h1; } #[cfg(test)] mod test { use super::murmurhash3_x86_32; #[test] fn test_empty_string() { assert!(murmurhash3_x86_32("".as_bytes(), 0) == 0); } #[test] fn test_tail_lengths() { assert!(murmurhash3_x86_32("1".as_bytes(), 0) == 2484513939); assert!(murmurhash3_x86_32("12".as_bytes(), 0) == 4191350549); assert!(murmurhash3_x86_32("123".as_bytes(), 0) == 2662625771); assert!(murmurhash3_x86_32("1234".as_bytes(), 0) == 1914461635); } #[test] fn test_large_data() { assert!(murmurhash3_x86_32("Lorem ipsum dolor sit amet, consectetur adipiscing elit. Etiam at consequat massa. Cras eleifend pellentesque ex, at dignissim libero maximus ut. Sed eget nulla felis".as_bytes(), 0) == 1004899618); } #[cfg(feature="nightly")] mod bench { extern crate rand; extern crate test; use std::iter::FromIterator; use self::rand::Rng; use self::test::{Bencher, black_box}; use super::super::murmurhash3_x86_32; fn run_bench(b: &mut Bencher, size: u64) { let mut data: Vec<u8> = FromIterator::from_iter((0..size).map(|_| 0u8)); rand::thread_rng().fill_bytes(&mut data); b.bytes = size; b.iter(|| { black_box(murmurhash3_x86_32(&data, 0)); }); } #[bench] fn bench_random_256k(b: &mut Bencher) { run_bench(b, 256 * 1024); } #[bench] fn bench_random_16b(b: &mut Bencher) { run_bench(b, 16); } } }