diff --git a/src/libcollections/hash/mod.rs b/src/libcollections/hash/mod.rs
index c59de19e822cc..4bf598a7a6625 100644
--- a/src/libcollections/hash/mod.rs
+++ b/src/libcollections/hash/mod.rs
@@ -76,6 +76,7 @@ use vec::Vec;
 pub use self::sip::hash as hash;
 
 pub mod sip;
+pub mod xxh;
 
 /// A hashable type. The `S` type parameter is an abstract hash state that is
 /// used by the `Hash` to compute the hash. It defaults to
diff --git a/src/libcollections/hash/xxh.rs b/src/libcollections/hash/xxh.rs
new file mode 100644
index 0000000000000..bc80f550bb090
--- /dev/null
+++ b/src/libcollections/hash/xxh.rs
@@ -0,0 +1,515 @@
+// Copyright 2014 The Rust Project Developers. See the COPYRIGHT
+// file at the top-level directory of this distribution and at
+// http://rust-lang.org/COPYRIGHT.
+//
+// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
+// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
+// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
+// option. This file may not be copied, modified, or distributed
+// except according to those terms.
+
+//! The 64-bit variant of xxHash.
+//!
+//! This is a *very* fast hash: it runs circles around all major
+//! general-purpose hashing algorithms. The implementation has been
+//! extensively micro-optimized to take full advantage of the
+//! instruction-level parallelism of modern hardware.
+//!
+//! Do not use this for any sort of cryptography.
+//!
+//! https://code.google.com/p/xxhash/
+//! http://fastcompression.blogspot.com/2014/07/xxhash-wider-64-bits.html
+
+// ILP is the heart of this algorithm:
+//
+// "XXH64 is therefore a fairly straightforward application of XXH methodology
+// to 64-bits: an inner loop with 4 interleaved streams, a tail sequence,
+// to handle input sizes which are not multiple of 32, and a final avalanche,
+// to ensure all bits are properly randomized." - Yann Collet
+//
+// This also means `unsafe` is necessary. The very first iteration gained
+// an immediate 3x speed boost just from removing the bounds checks. The
+// current implementation is good enough that benchmarks against the C
+// implementation must be done with clang: the LLVM/gcc backend difference
+// is a larger factor in the outcome than the code itself.
+//
+// It's probably best to consider this code as an exercise in writing
+// good tests.
+
+#![allow(dead_assignment)] // the last `read_ptr!` leaves a dead pointer assignment
+
+use core::prelude::*;
+use core::mem::{uninitialized, transmute};
+use core::raw::{Repr};
+use core::ptr::{copy_memory};
+
+use core::default::Default;
+
+use super::{Hash, Hasher, Writer};
+
+static PRIME1: u64 = 11400714785074694791_u64;
+static PRIME2: u64 = 14029467366897019727_u64;
+static PRIME3: u64 = 1609587929392839161_u64;
+static PRIME4: u64 = 9650029242287828579_u64;
+static PRIME5: u64 = 2870177450012600261_u64;
+
+fn rotl64(x: u64, b: uint) -> u64 { #![inline(always)]
+    (x << b) | (x >> (64 - b))
+}
+
+/// Hash a buffer in one call, without explicit state management.
+pub fn oneshot(input: &[u8], seed: u64) -> u64 { #![inline]
+    let mut state = XXState::new_with_seed(seed);
+    state.update(input);
+    state.digest()
+}
+
+pub struct XXState {
+    memory: [u64, ..4],  // buffer for input that has not been consumed yet
+    v1: u64,
+    v2: u64,
+    v3: u64,
+    v4: u64,
+    total_len: u64,      // total length of all input fed so far
+    seed: u64,
+    memsize: uint,       // number of bytes currently held in `memory`
+}
+
+// read an integer, advance the pointer by the appropriate amount
+// and do the endian dance
+macro_rules! read_ptr(($p:ident, $size:ty) => ({
+    let mut bp: *const $size = transmute($p);
+    let data: $size = *bp;
+    bp = bp.offset(1);
+    $p = transmute(bp);
+    data.to_le()
+}))
+
+impl XXState {
+    /// Create a new state with the given seed. Randomize the seed for
+    /// each set of hashes, e.g. when creating a new `HashMap`.
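+    ///
+    /// A minimal usage sketch; the `std::hash::xxh` path is an assumption
+    /// about where this module is re-exported, and the seed is arbitrary:
+    ///
+    /// ```rust
+    /// use std::hash::xxh::XXState;
+    ///
+    /// let mut state = XXState::new_with_seed(42);
+    /// state.update("hello ".as_bytes()); // feed input incrementally
+    /// state.update("world".as_bytes());
+    /// let h: u64 = state.digest();
+    /// ```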
+    pub fn new_with_seed(seed: u64) -> XXState { #![inline]
+        let mut state: XXState = unsafe { uninitialized() };
+        state.reset(seed);
+        state
+    }
+
+    pub fn new() -> XXState { #![inline]
+        XXState::new_with_seed(0)
+    }
+
+    /// Reinitialize. The next input will start a new hash.
+    pub fn reset(&mut self, seed: u64) { #![inline]
+        self.seed = seed;
+        self.v1 = seed + PRIME1 + PRIME2;
+        self.v2 = seed + PRIME2;
+        self.v3 = seed;
+        self.v4 = seed - PRIME1;
+        self.total_len = 0;
+        self.memsize = 0;
+    }
+
+    /// This is where you feed your data in.
+    pub fn update(&mut self, input: &[u8]) { #![inline] unsafe {
+        let mem: *mut u8 = transmute(&self.memory);
+        let mut rem: uint = input.len();
+        let mut data: *const u8 = input.repr().data;
+
+        self.total_len += rem as u64;
+
+        // not enough data for one 32-byte chunk,
+        // so just fill the buffer and return.
+        if self.memsize + rem < 32 {
+            let dst: *mut u8 = mem.offset(self.memsize as int);
+            copy_memory(dst, data, rem);
+            self.memsize += rem;
+            return;
+        }
+
+        // some data left from previous update
+        // fill the buffer and eat it
+        if self.memsize != 0 {
+            let dst: *mut u8 = mem.offset(self.memsize as int);
+            let bump: uint = 32 - self.memsize;
+            copy_memory(dst, data, bump);
+
+            // `read_ptr!` target
+            let mut p: *const u8 = transmute(mem);
+
+            macro_rules! read(($size:ty) => (read_ptr!(p, $size)))
+
+            macro_rules! eat(($v: ident) => ({
+                $v += read!(u64) * PRIME2; $v = rotl64($v, 31); $v *= PRIME1;
+            }))
+
+            // Detaching these does good things to performance.
+            // LLVM is not quite smart enough to do it on its own.
+            let mut v1: u64 = self.v1;
+            let mut v2: u64 = self.v2;
+            let mut v3: u64 = self.v3;
+            let mut v4: u64 = self.v4;
+
+            eat!(v1); eat!(v2); eat!(v3); eat!(v4);
+
+            // save the state
+            self.v1 = v1;
+            self.v2 = v2;
+            self.v3 = v3;
+            self.v4 = v4;
+
+            data = data.offset(bump as int);
+            rem -= bump;
+            self.memsize = 0;
+        }
+
+        {
+            macro_rules! read(($size:ty) => (read_ptr!(data, $size)))
+
+            // Note how `$v` does not depend on any other `v` in this phase.
+            // This is critical for speed.
+            macro_rules! eat(($v: ident) => ({
+                $v += read!(u64) * PRIME2; $v = rotl64($v, 31); $v *= PRIME1;
+            }))
+
+            // again, go-faster stripes
+            let mut v1: u64 = self.v1;
+            let mut v2: u64 = self.v2;
+            let mut v3: u64 = self.v3;
+            let mut v4: u64 = self.v4;
+
+            // the main loop: eat whole chunks
+            while rem >= 32 {
+                eat!(v1); eat!(v2); eat!(v3); eat!(v4);
+                rem -= 32;
+            }
+
+            self.v1 = v1;
+            self.v2 = v2;
+            self.v3 = v3;
+            self.v4 = v4;
+        }
+
+        // we have data left, so save it
+        if rem > 0 {
+            copy_memory(mem, data, rem);
+            self.memsize = rem;
+        }
+    }}
+
+    /// Compute the hash. This can be used for intermediate values too.
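+    ///
+    /// A sketch of the streaming property (the input and chunk size are
+    /// arbitrary, and `std::hash::xxh` is an assumed re-export path):
+    /// feeding the input in pieces yields the same digest as one shot.
+    ///
+    /// ```rust
+    /// use std::hash::xxh::{XXState, oneshot};
+    ///
+    /// let data = "abcdefghijklmnopqrstuvwxyz0123456789".as_bytes();
+    /// let mut state = XXState::new_with_seed(0);
+    /// for chunk in data.chunks(7) {
+    ///     state.update(chunk);
+    /// }
+    /// assert_eq!(state.digest(), oneshot(data, 0));
+    /// ```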
+    pub fn digest(&self) -> u64 { #![inline] unsafe {
+        let mut rem = self.memsize;
+        let mut h64: u64 = if self.total_len < 32 {
+            self.seed + PRIME5
+        } else {
+            // we have saved state
+            let mut v1: u64 = self.v1;
+            let mut v2: u64 = self.v2;
+            let mut v3: u64 = self.v3;
+            let mut v4: u64 = self.v4;
+
+            let mut h = rotl64(v1, 1) + rotl64(v2, 7) + rotl64(v3, 12) + rotl64(v4, 18);
+
+            macro_rules! permute(($v: ident) => ({
+                $v *= PRIME2; $v = rotl64($v, 31); $v *= PRIME1;
+                h ^= $v; h = h * PRIME1 + PRIME4;
+            }))
+            // this step does not exist in xxh32
+            permute!(v1); permute!(v2); permute!(v3); permute!(v4);
+
+            h
+        };
+
+        // and now we eat all the remaining bytes.
+        let mut p: *const u8 = transmute(&self.memory);
+        macro_rules! read(($size:ty) => (read_ptr!(p, $size)))
+
+        h64 += self.total_len as u64;
+
+        while rem >= 8 {
+            let mut k1: u64 = read!(u64) * PRIME2; k1 = rotl64(k1, 31); k1 *= PRIME1;
+            h64 ^= k1;
+            h64 = rotl64(h64, 27) * PRIME1 + PRIME4;
+            rem -= 8;
+        }
+
+        if rem >= 4 {
+            h64 ^= read!(u32) as u64 * PRIME1;
+            h64 = rotl64(h64, 23) * PRIME2 + PRIME3;
+            rem -= 4;
+        }
+
+        while rem > 0 {
+            h64 ^= read!(u8) as u64 * PRIME5;
+            h64 = rotl64(h64, 11) * PRIME1;
+            rem -= 1;
+        }
+
+        // final avalanche
+        h64 ^= h64 >> 33;
+        h64 *= PRIME2;
+        h64 ^= h64 >> 29;
+        h64 *= PRIME3;
+        h64 ^= h64 >> 32;
+
+        h64
+    }}
+}
+
+impl Writer for XXState {
+    fn write(&mut self, msg: &[u8]) { #![inline]
+        self.update(msg);
+    }
+}
+
+impl Clone for XXState {
+    fn clone(&self) -> XXState { #![inline]
+        *self
+    }
+}
+
+/// `XXHasher` computes the xxHash64 algorithm from a stream of bytes.
+pub struct XXHasher {
+    seed: u64
+}
+
+impl XXHasher {
+    pub fn new() -> XXHasher { #![inline]
+        XXHasher::new_with_seed(18446744073709551557u64)
+    }
+
+    pub fn new_with_seed(seed: u64) -> XXHasher { #![inline]
+        XXHasher { seed: seed }
+    }
+}
+
+impl Hasher<XXState> for XXHasher {
+    fn hash<T: Hash<XXState>>(&self, value: &T) -> u64 { #![inline]
+        let mut state = XXState::new_with_seed(self.seed);
+        value.hash(&mut state);
+        state.digest()
+    }
+}
+
+impl Default for XXHasher {
+    fn default() -> XXHasher { #![inline]
+        XXHasher::new()
+    }
+}
+
+pub fn hash<T: Hash<XXState>>(value: &T) -> u64 { #![inline]
+    let mut state = XXState::new();
+    value.hash(&mut state);
+    state.digest()
+}
+
+pub fn hash_with_seed<T: Hash<XXState>>(seed: u64, value: &T) -> u64 { #![inline]
+    let mut state = XXState::new_with_seed(seed);
+    value.hash(&mut state);
+    state.digest()
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use std::prelude::*;
+    use std::vec::Vec;
+    use test::Bencher;
+
+    /// the official sanity test
+    fn test_base(f: |&[u8], u64| -> u64) { #![inline(always)]
+        static BUFSIZE: uint = 101;
+        static PRIME: u32 = 2654435761;
+
+        let mut random: u32 = PRIME;
+        let mut buf: Vec<u8> = Vec::with_capacity(BUFSIZE);
+        for _ in range(0, BUFSIZE) {
+            buf.push((random >> 24) as u8);
+            random *= random;
+        }
+
+        let test = |size: uint, seed: u64, expected: u64| {
+            let result = f(buf.slice_to(size), seed);
+            assert_eq!(result, expected);
+        };
+
+        test(1,       0,            0x4FCE394CC88952D8);
+        test(1,       PRIME as u64, 0x739840CB819FA723);
+        test(14,      0,            0xCFFA8DB881BC3A3D);
+        test(14,      PRIME as u64, 0x5B9611585EFCC9CB);
+        test(BUFSIZE, 0,            0x0EAB543384F878AD);
+        test(BUFSIZE, PRIME as u64, 0xCAA65939306F1E21);
+    }
+
+    fn bench_base(bench: &mut Bencher, f: |&[u8]| -> u64) { #![inline(always)]
+        static BUFSIZE: uint = 64*1024;
+
+        let mut v: Vec<u8> = Vec::with_capacity(BUFSIZE);
+        for i in range(0, BUFSIZE) {
+            v.push(i as u8);
+        }
+
+        bench.iter(|| f(v.as_slice()));
+        bench.bytes = BUFSIZE as u64;
+    }
+
+    #[test]
+    fn test_oneshot() {
+        test_base(|v, seed| {
+            let mut state = XXState::new_with_seed(seed);
+            state.update(v);
+            state.digest()
+        })
+    }
+
+    #[test]
+    fn test_chunks() {
+        test_base(|v, seed| {
+            let mut state = XXState::new_with_seed(seed);
+            for chunk in v.chunks(15) {
+                state.update(chunk);
+            }
+            state.digest()
+        })
+    }
+
+    #[bench]
+    fn bench_64k_oneshot(b: &mut Bencher) {
+        bench_base(b, |v| oneshot(v, 0))
+    }
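+
+    // A hedged sanity check for `hash_with_seed`, which no other test
+    // exercises (the seeds and the input are arbitrary, not official test
+    // vectors): the same seed must reproduce the same hash, and distinct
+    // seeds should disagree on this input.
+    #[test]
+    fn test_hash_with_seed() {
+        let s = "some bytes";
+        assert_eq!(hash_with_seed(1, &s), hash_with_seed(1, &s));
+        assert!(hash_with_seed(1, &s) != hash_with_seed(2, &s));
+    }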
+ */ + + + #[test] #[cfg(target_arch = "arm")] + fn test_hash_uint() { + let val = 0xdeadbeef_deadbeef_u64; + assert!(hash(&(val as u64)) != hash(&(val as uint))); + assert_eq!(hash(&(val as u32)), hash(&(val as uint))); + } + #[test] #[cfg(target_arch = "x86_64")] + fn test_hash_uint() { + let val = 0xdeadbeef_deadbeef_u64; + assert_eq!(hash(&(val as u64)), hash(&(val as uint))); + assert!(hash(&(val as u32)) != hash(&(val as uint))); + } + #[test] #[cfg(target_arch = "x86")] + fn test_hash_uint() { + let val = 0xdeadbeef_deadbeef_u64; + assert!(hash(&(val as u64)) != hash(&(val as uint))); + assert_eq!(hash(&(val as u32)), hash(&(val as uint))); + } + + #[test] + fn test_hash_idempotent() { + let val64 = 0xdeadbeef_deadbeef_u64; + assert_eq!(hash(&val64), hash(&val64)); + let val32 = 0xdeadbeef_u32; + assert_eq!(hash(&val32), hash(&val32)); + } + + #[test] + fn test_hash_no_bytes_dropped_64() { + let val = 0xdeadbeef_deadbeef_u64; + + assert!(hash(&val) != hash(&zero_byte(val, 0))); + assert!(hash(&val) != hash(&zero_byte(val, 1))); + assert!(hash(&val) != hash(&zero_byte(val, 2))); + assert!(hash(&val) != hash(&zero_byte(val, 3))); + assert!(hash(&val) != hash(&zero_byte(val, 4))); + assert!(hash(&val) != hash(&zero_byte(val, 5))); + assert!(hash(&val) != hash(&zero_byte(val, 6))); + assert!(hash(&val) != hash(&zero_byte(val, 7))); + + fn zero_byte(val: u64, byte: uint) -> u64 { + assert!(byte < 8); + val & !(0xff << (byte * 8)) + } + } + + #[test] + fn test_hash_no_bytes_dropped_32() { + let val = 0xdeadbeef_u32; + + assert!(hash(&val) != hash(&zero_byte(val, 0))); + assert!(hash(&val) != hash(&zero_byte(val, 1))); + assert!(hash(&val) != hash(&zero_byte(val, 2))); + assert!(hash(&val) != hash(&zero_byte(val, 3))); + + fn zero_byte(val: u32, byte: uint) -> u32 { + assert!(byte < 4); + val & !(0xff << (byte * 8)) + } + } + + #[test] + fn test_hash_no_concat_alias() { + let s = ("aa", "bb"); + let t = ("aabb", ""); + let u = ("a", "abb"); + + assert!(s != t && t != u); + assert!(hash(&s) != hash(&t) && hash(&s) != hash(&u)); + + let v: (&[u8], &[u8], &[u8]) = (&[1u8], &[0u8, 0], &[0u8]); + let w: (&[u8], &[u8], &[u8]) = (&[1u8, 0, 0, 0], &[], &[]); + + assert!(v != w); + assert!(hash(&v) != hash(&w)); + } + + #[bench] + fn bench_str_under_8_bytes(b: &mut Bencher) { + let s = "foo"; + b.bytes=s.len() as u64; + b.iter(|| { + hash(&s) + }) + } + + #[bench] + fn bench_str_of_8_bytes(b: &mut Bencher) { + let s = "foobar78"; + b.bytes = s.len() as u64; + b.iter(|| { + hash(&s); + }) + } + + #[bench] + fn bench_str_over_8_bytes(b: &mut Bencher) { + let s = "foobarbaz0"; + b.bytes = s.len() as u64; + b.iter(|| { + hash(&s) + }) + } + + #[bench] + fn bench_long_str(b: &mut Bencher) { + let s = "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod tempor \ + incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam, quis nostrud \ + exercitation ullamco laboris nisi ut aliquip ex ea commodo consequat. Duis aute \ + irure dolor in reprehenderit in voluptate velit esse cillum dolore eu fugiat nulla \ + pariatur. Excepteur sint occaecat cupidatat non proident, sunt in culpa qui \ + officia deserunt mollit anim id est laborum."; + b.bytes = s.len() as u64; + b.iter(|| { + hash(&s) + }) + } + + #[bench] + fn bench_u64(b: &mut Bencher) { + let u = 16262950014981195938u64; + b.bytes = 8; + b.iter(|| { + hash(&u) + }) + } +}