diff --git a/src/jitter.rs b/src/jitter.rs
index a3914834b5d..7585304ae42 100644
--- a/src/jitter.rs
+++ b/src/jitter.rs
@@ -48,25 +48,53 @@ const MEMORY_SIZE: usize = MEMORY_BLOCKS * MEMORY_BLOCKSIZE;
 // Note: the C implementation relies on being compiled without optimizations.
 // This implementation goes through lengths to make the compiler not optimise
 // out what is technically dead code, but that does influence timing jitter.
-pub struct JitterRng {
+pub struct JitterRng<T: JitterTimer> {
     data: u64, // Actual random number
     // Number of rounds to run the entropy collector per 64 bits
-    rounds: u32,
-    // Timer and previous time stamp, used by `measure_jitter`
-    timer: fn() -> u64,
+    rounds: u8,
+    // Timer used by `measure_jitter`
+    timer: T,
+    // Memory for the Memory Access noise source FIXME
+    mem_prev_index: u16,
+    // Make `next_u32` not waste 32 bits
+    data_half_used: bool,
+}
+
+// Entropy collector state.
+// These values are not necessary to preserve across runs.
+struct EcState {
+    // Previous time stamp to determine the timer delta
     prev_time: u64,
     // Deltas used for the stuck test
-    last_delta: i64,
-    last_delta2: i64,
+    last_delta: i32,
+    last_delta2: i32,
     // Memory for the Memory Access noise source
-    mem_prev_index: usize,
     mem: [u8; MEMORY_SIZE],
-    // Make `next_u32` not waste 32 bits
-    data_remaining: Option<u32>,
+}
+
+impl EcState {
+    // Stuck test by checking the:
+    // - 1st derivation of the jitter measurement (time delta)
+    // - 2nd derivation of the jitter measurement (delta of time deltas)
+    // - 3rd derivation of the jitter measurement (delta of delta of time
+    //   deltas)
+    //
+    // All values must always be non-zero.
+    // This test is a heuristic to see whether the last measurement holds
+    // entropy.
+    fn stuck(&mut self, current_delta: i32) -> bool {
+        let delta2 = self.last_delta - current_delta;
+        let delta3 = delta2 - self.last_delta2;
+
+        self.last_delta = current_delta;
+        self.last_delta2 = delta2;
+
+        current_delta == 0 || delta2 == 0 || delta3 == 0
+    }
 }
 
 // Custom Debug implementation that does not expose the internal state
-impl fmt::Debug for JitterRng {
+impl<T: JitterTimer> fmt::Debug for JitterRng<T> {
     fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
         write!(f, "JitterRng {{}}")
     }
@@ -126,28 +154,34 @@ impl From<TimerError> for Error {
 #[cfg(feature="std")]
 static JITTER_ROUNDS: AtomicUsize = ATOMIC_USIZE_INIT;
 
-impl JitterRng {
+#[cfg(feature="std")]
+impl JitterRng<Timer> {
     /// Create a new `JitterRng`.
     /// Makes use of `std::time` for a timer.
     ///
     /// During initialization CPU execution timing jitter is measured a few
     /// hundred times. If this does not pass basic quality tests, an error is
     /// returned. The test result is cached to make subsequent calls faster.
-    #[cfg(feature="std")]
-    pub fn new() -> Result<JitterRng, TimerError> {
-        let mut ec = JitterRng::new_with_timer(platform::get_nstime);
-        let mut rounds = JITTER_ROUNDS.load(Ordering::Relaxed) as u32;
+    pub fn new() -> Result<JitterRng<Timer>, TimerError> {
+        let mut state = JitterRng::new_with_timer(Timer::default());
+
+        let mut rounds = JITTER_ROUNDS.load(Ordering::Relaxed) as u8;
         if rounds == 0 {
             // No result yet: run test.
             // This allows the timer test to run multiple times; we don't care.
-            rounds = ec.test_timer()?;
+            rounds = state.test_timer()?;
             JITTER_ROUNDS.store(rounds as usize, Ordering::Relaxed);
             info!("JitterRng: using {} rounds per u64 output", rounds);
         }
-        ec.set_rounds(rounds);
-        Ok(ec)
+        state.set_rounds(rounds);
+
+        // Fill `data` with a non-zero value.
+        state.gen_entropy();
+        Ok(state)
     }
+}
 
+impl<T: JitterTimer+Clone> JitterRng<T> {
     /// Create a new `JitterRng`.
     /// A custom timer can be supplied, making it possible to use `JitterRng` in
     /// `no_std` environments.
@@ -156,32 +190,17 @@ impl JitterRng {
     ///
     /// This method is more low-level than `new()`. It is the responsibility of
     /// the caller to run `test_timer` before using any numbers generated with
-    /// `JitterRng`, and optionally call `set_rounds()`.
-    pub fn new_with_timer(timer: fn() -> u64) -> JitterRng {
-        let mut ec = JitterRng {
+    /// `JitterRng`, and optionally call `set_rounds()`. Also it is important to
+    /// call `gen_entropy` once before using the first result to initialize the
+    /// entropy collection pool.
+    pub fn new_with_timer(timer: T) -> JitterRng<T> {
+        JitterRng {
             data: 0,
             rounds: 64,
-            timer: timer,
-            prev_time: 0,
-            last_delta: 0,
-            last_delta2: 0,
+            timer: timer.clone(),
             mem_prev_index: 0,
-            mem: [0; MEMORY_SIZE],
-            data_remaining: None,
-        };
-
-        // Fill `data`, `prev_time`, `last_delta` and `last_delta2` with
-        // non-zero values.
-        ec.prev_time = timer();
-        ec.gen_entropy();
-
-        // Do a single read from `self.mem` to make sure the Memory Access noise
-        // source is not optimised out.
-        // Note: this read is important, it effects optimisations for the entire
-        // module!
-        black_box(ec.mem[0]);
-
-        ec
+            data_half_used: false,
+        }
     }
 
     /// Configures how many rounds are used to generate each 64-bit value.
@@ -192,7 +211,7 @@ impl JitterRng {
     /// can be used. The `test_timer()` function returns the minimum number of
     /// rounds required for full strength (platform dependent), so one may use
     /// `rng.set_rounds(rng.test_timer()?);` or cache the value.
-    pub fn set_rounds(&mut self, rounds: u32) {
+    pub fn set_rounds(&mut self, rounds: u8) {
         assert!(rounds > 0);
         self.rounds = rounds;
     }
@@ -209,7 +228,7 @@ impl JitterRng {
     fn random_loop_cnt(&mut self, n_bits: u32) -> u32 {
         let mut rounds = 0;
 
-        let mut time = (self.timer)();
+        let mut time = self.timer.get_nstime();
         // Mix with the current state of the random number balance the random
         // loop counter a bit more.
         time ^= self.data;
@@ -296,11 +315,11 @@ impl JitterRng {
     // range of wait states. However, to reliably access either L3 or memory,
     // the `self.mem` memory must be quite large which is usually not desirable.
     #[inline(never)]
-    fn memaccess(&mut self, var_rounds: bool) {
+    fn memaccess(&mut self, mem: &mut [u8; MEMORY_SIZE], var_rounds: bool) {
         let mut acc_loop_cnt = 128;
         if var_rounds { acc_loop_cnt += self.random_loop_cnt(4) };
 
-        let mut index = self.mem_prev_index;
+        let mut index = self.mem_prev_index as usize;
         for _ in 0..acc_loop_cnt {
             // Addition of memblocksize - 1 to index with wrap around logic to
             // ensure that every memory location is hit evenly.
@@ -310,58 +329,37 @@ impl JitterRng {
 
             // memory access: just add 1 to one byte
             // memory access implies read from and write to memory location
-            let tmp = self.mem[index];
-            self.mem[index] = tmp.wrapping_add(1);
+            mem[index] = mem[index].wrapping_add(1);
         }
-        self.mem_prev_index = index;
-    }
-
-
-    // Stuck test by checking the:
-    // - 1st derivation of the jitter measurement (time delta)
-    // - 2nd derivation of the jitter measurement (delta of time deltas)
-    // - 3rd derivation of the jitter measurement (delta of delta of time
-    //   deltas)
-    //
-    // All values must always be non-zero.
-    // This test is a heuristic to see whether the last measurement holds
-    // entropy.
-    fn stuck(&mut self, current_delta: i64) -> bool {
-        let delta2 = self.last_delta - current_delta;
-        let delta3 = delta2 - self.last_delta2;
-
-        self.last_delta = current_delta;
-        self.last_delta2 = delta2;
-
-        current_delta == 0 || delta2 == 0 || delta3 == 0
+        self.mem_prev_index = index as u16;
     }
 
     // This is the heart of the entropy generation: calculate time deltas and
     // use the CPU jitter in the time deltas. The jitter is injected into the
     // entropy pool.
     //
-    // Ensure that `self.prev_time` is primed before using the output of this
+    // Ensure that `ec.prev_time` is primed before using the output of this
     // function. This can be done by calling this function and not using its
     // result.
-    fn measure_jitter(&mut self) -> Option<()> {
+    fn measure_jitter(&mut self, ec: &mut EcState) -> Option<()> {
         // Invoke one noise source before time measurement to add variations
-        self.memaccess(true);
+        self.memaccess(&mut ec.mem, true);
 
         // Get time stamp and calculate time delta to previous
         // invocation to measure the timing variations
-        let time = (self.timer)();
+        let time = self.timer.get_nstime();
         // Note: wrapping_sub combined with a cast to `i64` generates a correct
         // delta, even in the unlikely case this is a timer that is not strictly
         // monotonic.
-        let current_delta = time.wrapping_sub(self.prev_time) as i64;
-        self.prev_time = time;
+        let current_delta = time.wrapping_sub(ec.prev_time) as i64 as i32;
+        ec.prev_time = time;
 
         // Call the next noise source which also injects the data
         self.lfsr_time(current_delta as u64, true);
 
         // Check whether we have a stuck measurement (i.e. does the last
         // measurement holds entropy?).
-        if self.stuck(current_delta) { return None };
+        if ec.stuck(current_delta) { return None };
 
         // Rotate the data buffer by a prime number (any odd number would
         // do) to ensure that every bit position of the input time stamp
@@ -424,18 +422,28 @@ impl JitterRng {
 
     fn gen_entropy(&mut self) -> u64 {
         trace!("JitterRng: collecting entropy");
-        
-        // Prime `self.prev_time`, and run the noice sources to make sure the
+
+        // Prime `ec.prev_time`, and run the noice sources to make sure the
         // first loop round collects the expected entropy.
-        let _ = self.measure_jitter();
+        let mut ec = EcState {
+            prev_time: self.timer.get_nstime(),
+            last_delta: 0,
+            last_delta2: 0,
+            mem: [0; MEMORY_SIZE],
+        };
+        let _ = self.measure_jitter(&mut ec);
 
         for _ in 0..self.rounds {
             // If a stuck measurement is received, repeat measurement
             // Note: we do not guard against an infinite loop, that would mean
             // the timer suddenly became broken.
-            while self.measure_jitter().is_none() {}
+            while self.measure_jitter(&mut ec).is_none() {}
         }
 
+        // Do a single read from `self.mem` to make sure the Memory Access noise
+        // source is not optimised out.
+        black_box(ec.mem[0]);
+
         self.stir_pool();
         self.data
     }
@@ -446,7 +454,7 @@ impl JitterRng {
     /// If succesful, this will return the estimated number of rounds necessary
     /// to collect 64 bits of entropy. Otherwise a `TimerError` with the cause
     /// of the failure will be returned.
-    pub fn test_timer(&mut self) -> Result<u32, TimerError> {
+    pub fn test_timer(&mut self) -> Result<u8, TimerError> {
         debug!("JitterRng: testing timer ...");
         // We could add a check for system capabilities such as `clock_getres`
         // or check for `CONFIG_X86_TSC`, but it does not make much sense as the
@@ -462,6 +470,13 @@ impl JitterRng {
         let mut count_mod = 0;
         let mut count_stuck = 0;
 
+        let mut ec = EcState {
+            prev_time: self.timer.get_nstime(),
+            last_delta: 0,
+            last_delta2: 0,
+            mem: [0; MEMORY_SIZE],
+        };
+
         // TESTLOOPCOUNT needs some loops to identify edge systems.
         // 100 is definitely too little.
         const TESTLOOPCOUNT: u64 = 300;
@@ -469,16 +484,16 @@ impl JitterRng {
 
         for i in 0..(CLEARCACHE + TESTLOOPCOUNT) {
             // Measure time delta of core entropy collection logic
-            let time = (self.timer)();
-            self.memaccess(true);
+            let time = self.timer.get_nstime();
+            self.memaccess(&mut ec.mem, true);
             self.lfsr_time(time, true);
-            let time2 = (self.timer)();
+            let time2 = self.timer.get_nstime();
 
             // Test whether timer works
             if time == 0 || time2 == 0 {
                 return Err(TimerError::NoTimer);
             }
-            let delta = time2.wrapping_sub(time) as i64;
+            let delta = time2.wrapping_sub(time) as i64 as i32;
 
             // Test whether timer is fine grained enough to provide delta even
             // when called shortly after each other -- this implies that we also
@@ -494,7 +509,7 @@ impl JitterRng {
             // measurements.
             if i < CLEARCACHE { continue; }
 
-            if self.stuck(delta) { count_stuck += 1; }
+            if ec.stuck(delta) { count_stuck += 1; }
 
             // Test whether we have an increasing timer.
             if !(time2 > time) { time_backwards += 1; }
@@ -510,6 +525,10 @@ impl JitterRng {
             old_delta = delta;
         }
 
+        // Do a single read from `self.mem` to make sure the Memory Access noise
+        // source is not optimised out.
+        black_box(ec.mem[0]);
+
         // We allow the time to run backwards for up to three times.
         // This can happen if the clock is being adjusted by NTP operations.
         // If such an operation just happens to interfere with our test, it
@@ -550,26 +569,29 @@ impl JitterRng {
         // available bits of entropy per round here for two reasons:
         // 1. Simple estimates of the available bits (like Shannon entropy) are
         //    too optimistic.
-        // 2)  Unless we want to waste a lot of time during intialization, there
-        //     only a small number of samples are available.
+        // 2. Unless we want to waste a lot of time during intialization, there
+        //    only a small number of samples are available.
         //
         // Therefore we use a very simple and conservative estimate:
         // `let bits_of_entropy = log2(delta_average) / 2`.
         //
         // The number of rounds `measure_jitter` should run to collect 64 bits
         // of entropy is `64 / bits_of_entropy`.
-        //
-        // To have smaller rounding errors, intermediate values are multiplied
-        // by `FACTOR`. To compensate for `log2` and division rounding down,
-        // add 1.
         let delta_average = delta_sum / TESTLOOPCOUNT;
-        // println!("delta_average: {}", delta_average);
 
-        const FACTOR: u32  = 3;
-        fn log2(x: u64) -> u32 { 64 - x.leading_zeros() }
-
-        // pow(δ, FACTOR) must be representable; if you have overflow reduce FACTOR
-        Ok(64 * 2 * FACTOR / (log2(delta_average.pow(FACTOR)) + 1))
+        if delta_average >= 16 {
+            let log2 = 64 - delta_average.leading_zeros();
+            // Do something similar to roundup(64/(log2/2)):
+            Ok( ((64u32 * 2 + log2 - 1) / log2) as u8)
+        } else {
+            // For values < 16 the rounding error becomes too large, use a
+            // lookup table.
+            // Values 0 and 1 are invalid, and filtered out by the
+            // `delta_sum < TESTLOOPCOUNT` test above.
+            let log2_lookup = [0,  0, 128, 81, 64, 56, 50, 46,
+                               43, 41, 39, 38, 36, 35, 34, 33];
+            Ok(log2_lookup[delta_average as usize])
+        }
     }
 
     /// Statistical test: return the timer delta of one normal run of the
@@ -616,28 +638,33 @@ impl JitterRng {
     ///
     /// ```rust,no_run
     /// use rand::JitterRng;
+    /// use rand::jitter::JitterTimer;
     ///
     /// # use std::error::Error;
     /// # use std::fs::File;
     /// # use std::io::Write;
     /// #
     /// # fn try_main() -> Result<(), Box<Error>> {
-    /// fn get_nstime() -> u64 {
-    ///     use std::time::{SystemTime, UNIX_EPOCH};
+    /// #[derive(Clone, Debug, Default)]
+    /// struct Timer;
+    /// impl JitterTimer for Timer {
+    ///     fn get_nstime(&self) -> u64 {
+    ///         use std::time::{SystemTime, UNIX_EPOCH};
     ///
-    ///     let dur = SystemTime::now().duration_since(UNIX_EPOCH).unwrap();
-    ///     // The correct way to calculate the current time is
-    ///     // `dur.as_secs() * 1_000_000_000 + dur.subsec_nanos() as u64`
-    ///     // But this is faster, and the difference in terms of entropy is
-    ///     // negligible (log2(10^9) == 29.9).
-    ///     dur.as_secs() << 30 | dur.subsec_nanos() as u64
+    ///         let dur = SystemTime::now().duration_since(UNIX_EPOCH).unwrap();
+    ///         // The correct way to calculate the current time is
+    ///         // `dur.as_secs() * 1_000_000_000 + dur.subsec_nanos() as u64`
+    ///         // But this is faster, and the difference in terms of entropy is
+    ///         // negligible (log2(10^9) == 29.9).
+    ///         dur.as_secs() << 30 | dur.subsec_nanos() as u64
+    ///     }
     /// }
     ///
     /// // Do not initialize with `JitterRng::new`, but with `new_with_timer`.
     /// // 'new' always runst `test_timer`, and can therefore fail to
     /// // initialize. We want to be able to get the statistics even when the
     /// // timer test fails.
-    /// let mut rng = JitterRng::new_with_timer(get_nstime);
+    /// let mut rng = JitterRng::new_with_timer(Timer);
     ///
     /// // 1_000_000 results are required for the NIST SP 800-90B Entropy
     /// // Estimation Suite
@@ -665,18 +692,37 @@ impl JitterRng {
     /// ```
     #[cfg(feature="std")]
     pub fn timer_stats(&mut self, var_rounds: bool) -> i64 {
-        let time = platform::get_nstime();
-        self.memaccess(var_rounds);
+        let timer = Timer::default();
+        let mut mem = [0; MEMORY_SIZE];
+
+        let time = timer.get_nstime();
+        self.memaccess(&mut mem, var_rounds);
         self.lfsr_time(time, var_rounds);
-        let time2 = platform::get_nstime();
+        let time2 = timer.get_nstime();
         time2.wrapping_sub(time) as i64
     }
 }
 
-#[cfg(feature="std")]
-mod platform {
-    #[cfg(not(any(target_os = "macos", target_os = "ios", target_os = "windows", all(target_arch = "wasm32", not(target_os = "emscripten")))))]
-    pub fn get_nstime() -> u64 {
+/// Timer to be used by `JitterRng`.
+///
+/// Implement this trait to supply a custom timer to `JitterRng` with
+/// `new_with_timer`, making it possible to use in `no_std` environments.
+///
+/// The timer must have nanosecond precision.
+pub trait JitterTimer: Sized {
+    fn get_nstime(&self) -> u64;
+}
+
+#[derive(Clone, Debug, Default)]
+pub struct Timer;
+
+#[cfg(all(feature="std",
+          not(any(target_os = "macos",
+                  target_os = "ios",
+                  target_os = "windows",
+                  all(target_arch = "wasm32", not(target_os = "emscripten"))))))]
+impl JitterTimer for Timer {
+    fn get_nstime(&self) -> u64 {
         use std::time::{SystemTime, UNIX_EPOCH};
 
         let dur = SystemTime::now().duration_since(UNIX_EPOCH).unwrap();
@@ -686,9 +732,12 @@ mod platform {
         // (log2(10^9) == 29.9).
         dur.as_secs() << 30 | dur.subsec_nanos() as u64
     }
+}
 
-    #[cfg(any(target_os = "macos", target_os = "ios"))]
-    pub fn get_nstime() -> u64 {
+#[cfg(all(feature="std",
+      any(target_os = "macos", target_os = "ios")))]
+impl JitterTimer for Timer {
+    fn get_nstime(&self) -> u64 {
         extern crate libc;
         // On Mac OS and iOS std::time::SystemTime only has 1000ns resolution.
         // We use `mach_absolute_time` instead. This provides a CPU dependent unit,
@@ -698,9 +747,11 @@ mod platform {
         // use the raw result.
         unsafe { libc::mach_absolute_time() }
     }
+}
 
-    #[cfg(target_os = "windows")]
-    pub fn get_nstime() -> u64 {
+#[cfg(all(feature="std", target_os = "windows"))]
+impl JitterTimer for Timer {
+    fn get_nstime(&self) -> u64 {
         extern crate winapi;
         unsafe {
             let mut t = super::mem::zeroed();
@@ -708,9 +759,13 @@ mod platform {
             *t.QuadPart() as u64
         }
     }
+}
 
-    #[cfg(all(target_arch = "wasm32", not(target_os = "emscripten")))]
-    pub fn get_nstime() -> u64 {
+#[cfg(all(feature="std",
+          target_arch = "wasm32",
+          not(target_os = "emscripten")))]
+impl JitterTimer for Timer {
+    fn get_nstime(&self) -> u64 {
         unreachable!()
     }
 }
@@ -725,19 +780,21 @@ fn black_box<T>(dummy: T) -> T {
     }
 }
 
-impl Rng for JitterRng {
+impl<T: JitterTimer+Clone> Rng for JitterRng<T> {
     fn next_u32(&mut self) -> u32 {
         // We want to use both parts of the generated entropy
-        if let Some(high) = self.data_remaining.take() {
-            high
+        if self.data_half_used {
+            self.data_half_used = false;
+            (self.data >> 32) as u32
         } else {
-            let data = self.next_u64();
-            self.data_remaining = Some((data >> 32) as u32);
-            data as u32
+            self.data = self.next_u64();
+            self.data_half_used = true;
+            self.data as u32
         }
     }
 
     fn next_u64(&mut self) -> u64 {
+       self.data_half_used = false;
        self.gen_entropy()
     }