diff --git a/Cargo.toml b/Cargo.toml
index 7c2f62d..9ee1ca1 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -14,3 +14,9 @@ license = "MIT"
 
 [dev-dependencies]
 recycler="0.1.4"
+
+[profile.bench]
+# Multiple codegen units speed up compilation, but make compilation output less
+# deterministic and generally decrease codegen quality through worse inlining.
+# Let's turn it off for benchmarking.
+codegen-units = 1
diff --git a/README.md b/README.md
index 1c8565c..13de90c 100644
--- a/README.md
+++ b/README.md
@@ -3,7 +3,7 @@ A mortifying serialization library for Rust
 
 Abomonation (spelling intentional) is a serialization library for Rust based on the very simple idea that if someone presents data for serialization it will copy those exact bits, and then follow any pointers and copy those bits, and so on. When deserializing it recovers the exact bits, and then corrects pointers to aim at the serialized forms of the chased data.
 
-**Warning**: Abomonation should not be used on any data you care strongly about, or from any computer you value the data on. The `encode` and `decode` methods do things that may be undefined behavior, and you shouldn't stand for that. Specifically, `encode` exposes padding bytes to `memcpy`, and `decode` doesn't much respect alignment.
+**Warning**: Abomonation should not be used on any data you care strongly about, or from any computer you value the data on. The `encode` and `decode` methods do things that may be undefined behavior, and you shouldn't stand for that. Specifically, `encode` exposes padding bytes to `memcpy`, and `decode` doesn't much respect alignment and may need to construct Rust references to invalid data.
 
 Please consult the [abomonation documentation](https://frankmcsherry.github.com/abomonation) for more specific information.
 
@@ -49,7 +49,7 @@ Be warned that these numbers are not *goodput*, but rather the total number of b
 
 ## unsafe_abomonate!
 
-Abomonation comes with the `unsafe_abomonate!` macro implementing `Abomonation` for structs which are essentially equivalent to a tuple of other `Abomonable` types. To use the macro, you must put the `#[macro_use]` modifier before `extern crate abomonation;`.
+Abomonation comes with the `unsafe_abomonate!` macro implementing `Abomonation` for structs which are essentially equivalent to a tuple of other `Abomonation` types. To use the macro, you must put the `#[macro_use]` modifier before `extern crate abomonation;`.
 
 Please note that `unsafe_abomonate!` synthesizes unsafe implementations of `Abomonation`, and it should be considered unsafe to invoke.
 
@@ -82,4 +82,4 @@ if let Some((result, remaining)) = unsafe { decode::<Vec<(u64, String)>>(&mut bytes) } {
 }
 ```
-Be warned that implementing `Abomonable` for types can be a giant disaster and is entirely discouraged.
+Be warned that implementing `Abomonation` for types can be a giant disaster and is entirely discouraged.
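For readers skimming the diff, the round trip the README describes boils down to two calls. A minimal sketch mirroring the README's own example (the `Vec<(u64, String)>` payload is illustrative, not prescribed):

```rust
extern crate abomonation;
use abomonation::{encode, decode};

fn main() {
    // Some typed data: a vector of (number, string) pairs
    let typed = vec![(0u64, "grawwwwrr".to_string()); 32];

    // `encode` copies the exact bits of `typed`, then the bits behind its pointers
    let mut bytes = Vec::new();
    unsafe { encode(&typed, &mut bytes).unwrap(); }

    // `decode` fixes the pointers up in place and hands back a reference
    if let Some((result, remaining)) = unsafe { decode::<Vec<(u64, String)>>(&mut bytes) } {
        assert_eq!(result, &vec![(0u64, "grawwwwrr".to_string()); 32]);
        assert!(remaining.is_empty());
    }
}
```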
diff --git a/benches/bench.rs b/benches/bench.rs
index 9ce8a3c..e5d0c2b 100644
--- a/benches/bench.rs
+++ b/benches/bench.rs
@@ -30,8 +30,9 @@ use test::Bencher;
 #[bench] fn vec_u_vn_s_enc(bencher: &mut Bencher) { _bench_enc(bencher, vec![vec![(0u64, vec![(); 1 << 40], format!("grawwwwrr!")); 32]; 32]); }
 #[bench] fn vec_u_vn_s_dec(bencher: &mut Bencher) { _bench_dec(bencher, vec![vec![(0u64, vec![(); 1 << 40], format!("grawwwwrr!")); 32]; 32]); }
 
-fn _bench_enc<T: Abomonation>(bencher: &mut Bencher, record: T) {
-
+fn _bench_enc<T>(bencher: &mut Bencher, record: T)
+    where for<'de> T: Abomonation<'de>
+{
     // prepare encoded data for bencher.bytes
     let mut bytes = Vec::new();
     unsafe { encode(&record, &mut bytes).unwrap(); }
@@ -40,12 +41,13 @@ fn _bench_enc<T: Abomonation>(bencher: &mut Bencher, record: T) {
     bencher.bytes = bytes.len() as u64;
     bencher.iter(|| {
         bytes.clear();
-        unsafe { encode(&record, &mut bytes).unwrap(); }
+        unsafe { encode(&record, &mut bytes).unwrap() }
     });
 }
 
-fn _bench_dec<T: Abomonation+Eq>(bencher: &mut Bencher, record: T) {
-
+fn _bench_dec<T>(bencher: &mut Bencher, record: T)
+    where for<'de> T: Abomonation<'de> + Eq
+{
     // prepare encoded data
     let mut bytes = Vec::new();
     unsafe { encode(&record, &mut bytes).unwrap(); }
diff --git a/benches/clone.rs b/benches/clone.rs
index a040895..7078d3d 100644
--- a/benches/clone.rs
+++ b/benches/clone.rs
@@ -27,8 +27,9 @@ use test::Bencher;
 #[bench] fn vec_u_vn_s_e_d(bencher: &mut Bencher) { _bench_e_d(bencher, vec![vec![(0u64, vec![(); 1 << 40], format!("grawwwwrr!")); 32]; 32]); }
 #[bench] fn vec_u_vn_s_cln(bencher: &mut Bencher) { _bench_cln(bencher, vec![vec![(0u64, vec![(); 1 << 40], format!("grawwwwrr!")); 32]; 32]); }
 
-fn _bench_e_d<T: Abomonation>(bencher: &mut Bencher, record: T) {
-
+fn _bench_e_d<T>(bencher: &mut Bencher, record: T)
+    where for<'de> T: Abomonation<'de>
+{
     // prepare encoded data for bencher.bytes
     let mut bytes = Vec::new();
     unsafe { encode(&record, &mut bytes).unwrap(); }
@@ -42,8 +43,9 @@ fn _bench_e_d<T: Abomonation>(bencher: &mut Bencher, record: T) {
     });
 }
 
-fn _bench_cln<T: Abomonation+Clone>(bencher: &mut Bencher, record: T) {
-
+fn _bench_cln<T>(bencher: &mut Bencher, record: T)
+    where for<'de> T: Abomonation<'de> + Clone
+{
     // prepare encoded data
     let mut bytes = Vec::new();
     unsafe { encode(&record, &mut bytes).unwrap(); }
diff --git a/benches/recycler.rs b/benches/recycler.rs
index cc9ae94..fef1bee 100644
--- a/benches/recycler.rs
+++ b/benches/recycler.rs
@@ -27,8 +27,9 @@ use test::Bencher;
 // TODO : this reveals that working with a `vec![(); 1 << 40]` does not get optimized away.
 // #[bench] fn vec_u_vn_s_rec(bencher: &mut Bencher) { _bench_rec(bencher, vec![vec![(0u64, vec![(); 1 << 40], format!("grawwwwrr!")); 32]; 32]); }
 
-fn _bench_own<T: Abomonation+Clone>(bencher: &mut Bencher, record: T) {
-
+fn _bench_own<T>(bencher: &mut Bencher, record: T)
+    where for<'de> T: Abomonation<'de> + Clone
+{
     // prepare encoded data
     let mut bytes = Vec::new();
     unsafe { encode(&record, &mut bytes).unwrap(); }
@@ -42,8 +43,9 @@ fn _bench_own<T: Abomonation+Clone>(bencher: &mut Bencher, record: T) {
 }
 
-fn _bench_rec<T: Abomonation+Recyclable>(bencher: &mut Bencher, record: T) {
-
+fn _bench_rec<T>(bencher: &mut Bencher, record: T)
+    where for<'de> T: Abomonation<'de> + Recyclable
+{
     // prepare encoded data
     let mut bytes = Vec::new();
     unsafe { encode(&record, &mut bytes).unwrap(); }
diff --git a/src/abomonated.rs b/src/abomonated.rs
index 328b195..02732ca 100644
--- a/src/abomonated.rs
+++ b/src/abomonated.rs
@@ -1,5 +1,4 @@
-use std::mem::transmute;
 use std::marker::PhantomData;
 use std::ops::{Deref, DerefMut};
 
@@ -7,17 +6,22 @@ use super::{Abomonation, decode};
 /// A type wrapping owned decoded abomonated data.
 ///
-/// This type ensures that decoding and pointer correction has already happened,
-/// and implements `Deref` using a pointer cast (transmute).
+/// This type ensures that decoding and pointer correction has already happened.
+/// It provides a way to move the deserialized data around, while keeping
+/// on-demand access to it via the `as_ref()` method.
+///
+/// As an extra convenience, `Deref` is also implemented if T does
+/// not contain references. Unfortunately, this trait cannot be safely
+/// implemented when T does contain references.
 ///
 /// #Safety
 ///
-/// The safety of this type, and in particular its `transmute` implementation of
-/// the `Deref` trait, relies on the owned bytes not being externally mutated
-/// once provided. You could imagine a new type implementing `DerefMut` as required,
-/// but which also retains the ability (e.g. through `RefCell`) to mutate the bytes.
-/// This would be very bad, but seems hard to prevent in the type system. Please
-/// don't do this.
+/// The safety of this type, and in particular of access to the deserialized
+/// data, relies on the owned bytes not being externally mutated after the
+/// `Abomonated` is constructed. You could imagine a new type implementing
+/// `DerefMut` as required, but which also retains the ability (e.g. through
+/// `RefCell`) to mutate the bytes. This would be very bad, but seems hard to
+/// prevent in the type system. Please don't do this.
 ///
 /// You must also use a type `S` whose bytes have a fixed location in memory.
 /// Otherwise moving an instance of `Abomonated` may invalidate decoded
@@ -54,8 +58,11 @@ pub struct Abomonated<T, S: DerefMut<Target=[u8]>> {
     decoded: S,
 }
 
-impl<T: Abomonation, S: DerefMut<Target=[u8]>> Abomonated<T, S> {
-
+impl<'s, 't, T, S> Abomonated<T, S>
+    where S: DerefMut<Target=[u8]> + 's,
+          T: Abomonation<'t>,
+          's: 't
+{
     /// Attempts to create decoded data from owned mutable bytes.
     ///
     /// This method will return `None` if it is unable to decode the data with
@@ -94,34 +101,64 @@ impl<T: Abomonation, S: DerefMut<Target=[u8]>> Abomonated<T, S> {
     /// not change if the `bytes: S` instance is moved. Good examples are
     /// `Vec<u8>` whereas bad examples are `[u8; 16]`.
     pub unsafe fn new(mut bytes: S) -> Option<Self> {
+        // Fix type `T`'s inner pointers. Will return `None` on failure.
+        //
+        // FIXME: `slice::from_raw_parts_mut` is used to work around the borrow
+        //        checker marking `bytes` as forever borrowed if `&mut bytes` is
+        //        directly passed as input to `decode()`. But that is itself a
+        //        byproduct of the API contract specified by the `where` clause
+        //        above, which allows S to be `&'t mut [u8]` (and therefore
+        //        require such a perpetual borrow) in the worst case.
+        //
+        //        A different API contract might allow us to achieve the same
+        //        result without resorting to such evil unsafe tricks.
+        //
+        decode::<T>(std::slice::from_raw_parts_mut(bytes.as_mut_ptr(),
+                                                   bytes.len()))?;
 
-        // performs the underlying pointer correction, indicates success.
-        let decoded = decode::<T>(bytes.deref_mut()).is_some();
-
-        if decoded {
-            Some(Abomonated {
-                phantom: PhantomData,
-                decoded: bytes,
-            })
-        }
-        else {
-            None
-        }
+        // Build the Abomonated structure
+        Some(Abomonated {
+            phantom: PhantomData,
+            decoded: bytes,
+        })
     }
 }
 
-impl<T: Abomonation, S: DerefMut<Target=[u8]>> Abomonated<T, S> {
+impl<'t, T, S> Abomonated<T, S>
+    where S: DerefMut<Target=[u8]>,
+          T: Abomonation<'t>
+{
+    /// Get a read-only view on the deserialized bytes
     pub fn as_bytes(&self) -> &[u8] {
         &self.decoded
     }
-}
 
+    /// Get a read-only view on the deserialized data
+    //
+    // NOTE: This method can be safely used even if type T contains references,
+    //       because it makes sure that the borrow of `self` lasts long enough
+    //       to encompass the lifetime of these references.
+    //
+    //       Otherwise, it would be possible to extract an `&'static Something`
+    //       from a short-lived borrow of a `Box<[u8]>`, then drop the `Box`,
+    //       and end up with a dangling reference.
+    //
+    pub fn as_ref<'a: 't>(&'a self) -> &'a T {
+        unsafe { &*(self.decoded.as_ptr() as *const T) }
+    }
+}
 
-impl<T: Abomonation, S: DerefMut<Target=[u8]>> Deref for Abomonated<T, S> {
+// NOTE: The lifetime constraint that was applied to `as_ref()` cannot be
+//       applied to a `Deref` implementation. Therefore, `Deref` can only be
+//       used on types T which do not contain references, as enforced by the
+//       higher-ranked trait bound below.
+impl<T, S> Deref for Abomonated<T, S>
+    where S: DerefMut<Target=[u8]>,
+          for<'t> T: Abomonation<'t>,
+{
     type Target = T;
     #[inline]
     fn deref(&self) -> &T {
-        let result: &T = unsafe { transmute(self.decoded.get_unchecked(0)) };
-        result
+        self.as_ref()
     }
 }
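To make the reworked `as_ref()` API above concrete, here is a minimal usage sketch. It assumes a hypothetical `Vec<(u64, String)>` payload and a byte buffer that happens to be sufficiently aligned; buffers of unknown alignment should go through the `align` module introduced below:

```rust
use abomonation::{encode, abomonated::Abomonated};

fn main() {
    // Serialize a value into an owned byte buffer
    let mut bytes = Vec::new();
    unsafe { encode(&vec![(0u64, "hello".to_string())], &mut bytes).unwrap(); }

    // Wrap the bytes; decoding and pointer correction happen once, up front
    if let Some(decoded) = unsafe { Abomonated::<Vec<(u64, String)>, _>::new(bytes) } {
        // The wrapper owns the bytes and can be moved around freely;
        // `as_ref()` borrows the decoded value for as long as we hold it
        assert_eq!(decoded.as_ref().len(), 1);
        assert_eq!(decoded.as_ref()[0].1, "hello");
    }
}
```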
diff --git a/src/align/alloc.rs b/src/align/alloc.rs
new file mode 100644
index 0000000..dcf974c
--- /dev/null
+++ b/src/align/alloc.rs
@@ -0,0 +1,275 @@
+/// Tools for storing abomonated objects with correct alignment
+///
+/// Use of `decode::<T>()` requires that the input bytes are aligned on a
+/// `T::alignment()` boundary, or else undefined behavior will ensue.
+///
+/// This module provides tools for ensuring this alignment constraint on input
+/// bytes of unknown or known-incorrect alignment before calling `decode()`.
+
+use crate::{
+    Entomb,
+    Exhume,
+};
+
+use std::{
+    alloc::{self, Layout},
+    marker::PhantomData,
+    ops::{Deref, DerefMut},
+    ptr::NonNull,
+};
+
+
+/// Overaligned `Box<[u8]>` for abomonated objects of type T
+///
+/// Compared with a regular `Box<[u8]>`, this heap-allocated bag of bytes also
+/// ensures that the heap allocation is aligned on `T::alignment()`, and thus
+/// suitable for use as input to `decode::<T>()`.
+pub struct Coffin<T: Entomb>(NonNull<[u8]>, PhantomData<T>);
+
+impl<T: Entomb> Coffin<T> {
+    /// Copy abomonated bytes into a suitably aligned heap allocation
+    ///
+    /// May abort the computation if memory is exhausted or the system allocator
+    /// is not able to satisfy the size or alignment requirements.
+    pub fn new(bytes: &[u8]) -> Self {
+        // Compute the memory layout of the target memory allocation
+        let size = bytes.len();
+        let layout = Self::layout(size);
+
+        // Handle zero-sized types just like Box does
+        if layout.size() == 0 {
+            return Self (
+                unsafe { std::slice::from_raw_parts_mut(
+                    NonNull::dangling().as_ptr(),
+                    0,
+                ) }.into(),
+                PhantomData,
+            )
+        }
+
+        // Perform the memory allocation using the system allocator. This is
+        // safe because all safety preconditions are checked by Self::layout(),
+        // except for zero-sized allocations which we checked above.
+        let ptr = unsafe { alloc::alloc(layout) };
+
+        // Abort on memory allocation errors the recommended way. Since the
+        // system allocator may abort, no point in not aborting ourselves...
+        if ptr.is_null() { alloc::handle_alloc_error(layout); }
+
+        // Transfer the input bytes on our new allocation. This is safe as...
+        // - `bytes.as_ptr()` has to be valid for `size` by slice construction
+        // - `ptr` is non-null and must point to a memory region of `size` bytes
+        // - Pointers are always byte-aligned, so alignment is irrelevant.
+        // - Heap allocations may not overlap with existing objects.
+        unsafe { ptr.copy_from_nonoverlapping(bytes.as_ptr(), size); }
+
+        // Produce the output slice. The transmute is safe as...
+        // - We don't care about lifetimes as we want a NonNull in the end
+        // - As discussed above, `ptr` is non-null and well-aligned.
+        // - The bytes of the slice have been initialized above
+        Self(unsafe { std::slice::from_raw_parts_mut(ptr, size) }.into(),
+             PhantomData)
+    }
+
+    /// Compute the proper layout for a coffin allocation, checking most safety
+    /// preconditions of the system memory allocator along the way **except for
+    /// the "no zero-sized allocation" requirement**.
+    ///
+    /// We handle errors via panics because they all emerge from edge cases that
+    /// should only be encountered by users actively trying to break this code.
+    fn layout(size: usize) -> Layout {
+        // Basic sanity check for debug builds
+        debug_assert!(size >= std::mem::size_of::<T>(),
+                      "Requested size is quite obviously not big enough");
+
+        // At this point, the only layout errors that remain are those caused by
+        // a bad Abomonation::alignment implementation (alignment is zero or not
+        // a power of 2) or by a huge input size (close to usize::MAX).
+        Layout::from_size_align(size, T::alignment())
+               .expect("Bad Abomonation::alignment() impl or excessive size")
+    }
+}
+
+impl<T: Entomb> Deref for Coffin<T> {
+    type Target = [u8];
+
+    fn deref(&self) -> &Self::Target {
+        // This is safe as...
+        // - The target allocation is live until the Coffin will be dropped.
+        // - Normal borrow-checking rules apply and prevent the user from
+        //   aliasing or retaining the output reference in an invalid way.
+        //
+        // ...but see the Drop documentation for a possible edge case :(
+        unsafe { self.0.as_ref() }
+    }
+}
+
+impl<T: Entomb> DerefMut for Coffin<T> {
+    fn deref_mut(&mut self) -> &mut Self::Target {
+        // This is safe for the same reason that Deref is.
+        unsafe { self.0.as_mut() }
+    }
+}
+
+impl<T: Entomb> Drop for Coffin<T> {
+    fn drop(&mut self) {
+        // In principle, this should be safe for the same reason that DerefMut
+        // is, however there is a wrinkle for all of those...
+        //
+        // If we want any form of Deref to be safe, the Rust compiler must
+        // prevent LLVM from inserting memory reads from the slice after
+        // deallocation, and currently it doesn't.
+        //
+        // There is no clear reason why LLVM would do this, though, and `std`
+        // encounters the same problem everywhere, so we'll take the risk...
+        //
+        // FIXME: Once the Rust team has figured out the right way to handle
+        //        this, use it here if it requires manual action.
+        //
+        //        Here's one ongoing discussion of this topic for reference:
+        //        https://github.com/rust-lang/rust/issues/55005
+        let slice = unsafe { self.0.as_mut() };
+
+        // There is no allocation to deallocate for zero-sized types.
+        if slice.len() == 0 {
+            return;
+        }
+
+        // Deallocate the memory otherwise. This is safe because...
+        // - Every Coffin is always created with its own allocation, only Drop
+        //   can liberate it, and Drop will only be called once.
+        // - Layout is computed in the same way as in `Coffin::new()`, and the
+        //   size of the target slice is the same as that of new's input bytes.
+        unsafe { alloc::dealloc(slice.as_mut_ptr(),
+                                Self::layout(slice.len())); }
+    }
+}
+
+
+/// `Cow`-style abstraction for aligning abomonated bytes before `decode()`
+///
+/// Often, one needs to decode input bytes which are _probably_ well-aligned,
+/// but may not always be. For example, POSIX memory allocations are aligned
+/// on 16-byte boundaries, which is sufficient for most types... as long as
+/// multiple abomonated objects are not stored in a sequence without padding
+/// bytes in between.
+///
+/// In those circumstances, pessimistically using `Coffin<T>` all the time
+/// would cause unnecessarily intensive use of the system memory allocator.
+/// Instead, it is better to check if the input bytes are well-aligned and only
+/// reallocate them if necessary, which is what this abstraction does.
+pub enum AlignedBytes<'bytes, T: Exhume<'bytes>> {
+    /// The original bytes were sufficiently well-aligned
+    Borrowed(&'bytes mut [u8]),
+
+    /// The abomonated bytes were relocated into a well-aligned heap location
+    Owned(Coffin<T>),
+}
+
+impl<'bytes, T: Exhume<'bytes>> AlignedBytes<'bytes, T> {
+    /// Prepare possibly misaligned bytes for decoding
+    pub fn new(bytes: &'bytes mut [u8]) -> Self {
+        let misalignment = (bytes.as_ptr() as usize) % T::alignment();
+        if misalignment == 0 {
+            Self::Borrowed(bytes)
+        } else {
+            Self::Owned(Coffin::new(bytes))
+        }
+    }
+}
+
+impl<'bytes, T: Exhume<'bytes>> From<&'bytes mut [u8]> for AlignedBytes<'bytes, T> {
+    fn from(bytes: &'bytes mut [u8]) -> Self {
+        Self::new(bytes)
+    }
+}
+
+impl<'bytes, T: Exhume<'bytes>> From<Coffin<T>> for AlignedBytes<'bytes, T> {
+    fn from(coffin: Coffin<T>) -> Self {
+        Self::Owned(coffin)
+    }
+}
+
+impl<'bytes, T: Exhume<'bytes>> Deref for AlignedBytes<'bytes, T> {
+    type Target = [u8];
+
+    fn deref(&self) -> &[u8] {
+        match self {
+            Self::Borrowed(b) => b,
+            Self::Owned(o) => o,
+        }
+    }
+}
+
+impl<'bytes, T: Exhume<'bytes>> DerefMut for AlignedBytes<'bytes, T> {
+    fn deref_mut(&mut self) -> &mut [u8] {
+        match self {
+            Self::Borrowed(b) => b,
+            Self::Owned(o) => o,
+        }
+    }
+}
+
+
+#[cfg(test)]
+mod tests {
+    use super::{AlignedBytes, Coffin, Entomb, Exhume};
+
+    #[test]
+    fn coffin() {
+        check_coffin::<u8>();
+        check_coffin::<u16>();
+        check_coffin::<u32>();
+        check_coffin::<u64>();
+        check_coffin::<u128>();
+    }
+
+    fn check_coffin<T: Entomb>() {
+        let bytes = make_test_bytes_for::<T>();
+        let coffin = Coffin::<T>::new(&bytes[..]);
+        assert_eq!(&coffin[..], &bytes[..],
+                   "Coffin data is incorrect");
+        assert_eq!(coffin.as_ptr() as usize % T::alignment(), 0,
+                   "Coffin alignment is not strong enough");
+    }
+
+    #[test]
+    fn aligned_bytes() {
+        check_aligned_bytes::<u16>();
+        check_aligned_bytes::<u32>();
+        check_aligned_bytes::<u64>();
+        check_aligned_bytes::<u128>();
+    }
+
+    fn check_aligned_bytes<T>()
+        where for<'a> T: Exhume<'a>
+    {
+        assert!(std::mem::align_of::<T>() > 1,
+                "This test requires generating misaligned data");
+
+        let mut bytes = make_test_bytes_for::<T>();
+        let mut coffin = Coffin::<T>::new(&bytes[..]);
+        let aligned_bytes = AlignedBytes::<T>::new(&mut coffin[..]);
+        match aligned_bytes {
+            AlignedBytes::Borrowed(_) => {}
+            AlignedBytes::Owned(_) => panic!("Should not allocate here"),
+        }
+        assert_eq!(&aligned_bytes[..], &bytes[..]);
+
+        bytes.push(42);
+        let mut coffin = Coffin::<T>::new(&bytes[..]);
+        let aligned_bytes = AlignedBytes::<T>::new(&mut coffin[1..]);
+        match aligned_bytes {
+            AlignedBytes::Borrowed(_) => panic!("Should allocate here"),
+            AlignedBytes::Owned(_) => {},
+        }
+        assert_eq!(&aligned_bytes[..], &bytes[1..]);
+    }
+
+    fn make_test_bytes_for<T>() -> Vec<u8> {
+        let mut i = 0;
+        std::iter::repeat_with(|| { i += 1; i })
+                  .take(std::mem::size_of::<T>())
+                  .collect::<Vec<u8>>()
+    }
+}
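A usage sketch for the two tools above, under the assumption of a `Vec<u64>` payload: `AlignedBytes` borrows the input when it is already aligned and only falls back to a `Coffin` copy when it is not:

```rust
use abomonation::{encode, decode, align::AlignedBytes};

fn main() {
    // Serialize into a plain Vec<u8>, whose data alignment is not guaranteed
    let mut bytes = Vec::new();
    unsafe { encode(&vec![1u64, 2, 3], &mut bytes).unwrap(); }

    // Borrow the bytes if they are well-aligned for Vec<u64>,
    // or copy them into an overaligned Coffin allocation otherwise
    let mut aligned = AlignedBytes::<Vec<u64>>::new(&mut bytes[..]);

    // Either way, `decode` now sees suitably aligned input
    if let Some((decoded, _rest)) = unsafe { decode::<Vec<u64>>(&mut aligned[..]) } {
        assert_eq!(decoded, &vec![1u64, 2, 3]);
    }
}
```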
diff --git a/src/align/io.rs b/src/align/io.rs
new file mode 100644
index 0000000..b729b78
--- /dev/null
+++ b/src/align/io.rs
@@ -0,0 +1,308 @@
+/// Tools for reading and writing abomonated data in an alignment-aware way
+///
+/// In order to enable UB-free in-place deserialization, abomonated objects
+/// follow Rust's normal memory alignment rules. This requires inserting padding
+/// bytes between serialized data and skipping them on readout. This module
+/// provides tools to take care of this.
+
+use std::{
+    io::Write,
+    mem::{self, MaybeUninit},
+    ptr::NonNull,
+};
+
+
+/// Alignment-aware binary data writer
+///
+/// This wrapper around a standard Rust writer allows writing multiple binary
+/// objects in a sequence with a memory layout that is suitable for in-place
+/// readout. It does so by inserting padding bytes between the objects as if
+/// they were members of a well-aligned C-style struct whose alignment is the
+/// maximum of the alignment of all written objects.
+pub struct AlignedWriter<W: Write> {
+    /// Inner writer to which data is eventually dispatched
+    inner: W,
+
+    /// Amount of data that was sent to the inner writer so far
+    written_so_far: usize,
+
+    /// Expected alignment of the output data
+    #[cfg(debug_assertions)]
+    output_alignment: usize,
+}
+
+impl<W: Write> AlignedWriter<W> {
+    /// Prepare a writer for alignment-aware binary writes
+    ///
+    /// In debug builds, `AlignedWriter` will check that the output memory
+    /// allocation is sufficiently well-aligned for the data that is written
+    /// into it, as per the `output_alignment` parameter to this function.
+    //
+    // FIXME: output_alignment should be #[cfg(debug_assertions)], but at the
+    //        moment Rust 1.39 is a bit too freshly released to rely on that.
+    #[allow(unused)]
+    pub fn new(inner: W, output_alignment: usize) -> Self {
+        Self {
+            inner,
+            written_so_far: 0,
+            #[cfg(debug_assertions)] output_alignment,
+        }
+    }
+
+    /// Write arbitrary binary data into the inner writer
+    ///
+    /// This is unsafe because Rust does not yet provide an UB-free way to
+    /// expose the padding bytes of arbitrary T objects to writers.
+    pub unsafe fn write_slice<T>(&mut self, data: &[T]) -> crate::IOResult<()> {
+        // Check how aligned the binary data needs to be
+        let alignment = mem::align_of_val::<[T]>(data);
+
+        // In debug builds, check that the output allocation has sufficiently
+        // strong alignment for the data that's being written to it.
+        //
+        // If the output alignment is too low, readout may go wrong because the
+        // AlignedReader will skip a number of padding bytes that may not be
+        // in sync with the amount that AlignedWriter has inserted, in a manner
+        // that depends on how the data being read out was _actually_ aligned.
+        #[cfg(debug_assertions)]
+        debug_assert!(
+            alignment <= self.output_alignment,
+            "Insufficient output alignment (output alignment is {}, got data of alignment {})",
+            self.output_alignment, alignment
+        );
+
+        // Inject padding bytes until the output is well-aligned, assuming that
+        // the first byte that was written was well-aligned for all output data.
+        while self.written_so_far % alignment != 0 {
+            self.inner.write_all(&[0u8])?;
+            self.written_so_far += 1;
+        }
+
+        // This is the correct way to reinterpret typed data as bytes, it
+        // accounts for the fact that T may contain padding bytes.
+        let bytes = std::slice::from_raw_parts(
+            data.as_ptr() as *const MaybeUninit<u8>,
+            data.len() * mem::size_of::<T>()
+        );
+
+        // FIXME: Unfortunately, `Write::write_all()` expects initialized
+        //        bytes. This transmute is undefined behavior if T contains
+        //        uninitialized padding bytes.
+        //
+        //        To resolve this UB, we'd need either a "freeze" operation
+        //        that turns uninitialized bytes into arbitrary initialized
+        //        bytes, or a `Write` interface that accepts uninit bytes.
+        //
+        //        See this Rust internals forum topic for more discussion:
+        //        https://internals.rust-lang.org/t/writing-down-binary-data-with-padding-bytes/11197/
+        //
+        self.inner.write_all(mem::transmute::<&[MaybeUninit<u8>], &[u8]>(bytes))?;
+
+        // Keep track of the amount of emitted data and exit
+        self.written_so_far += mem::size_of_val::<[T]>(data);
+        Ok(())
+    }
+
+    /// Convenience function for non-slice data
+    ///
+    /// This is unsafe for the same reason that `write_slice` is.
+    pub unsafe fn write<T>(&mut self, data: &T) -> crate::IOResult<()> {
+        self.write_slice(std::slice::from_ref(data))
+    }
+
+    /// Query how much data was written so far
+    pub fn written_so_far(&self) -> usize {
+        self.written_so_far
+    }
+}
+
+impl<W: Write> Write for AlignedWriter<W> {
+    fn write(&mut self, buf: &[u8]) -> crate::IOResult<usize> {
+        // This will write buf.len() data because bytes are always well-aligned
+        // It is safe because &[u8] has no padding bytes
+        unsafe { self.write_slice(buf)? };
+        Ok(buf.len())
+    }
+
+    fn flush(&mut self) -> crate::IOResult<()> {
+        // No flushing necessary, we don't buffer anything
+        Ok(())
+    }
+}
+
+
+/// Slice-of-bytes reader for data written by `AlignedWriter`
+///
+/// This reader takes as input a bunch of bytes that were written by
+/// `AlignedWriter` and allows fetching back the corresponding binary data under
+/// the assumption that the input bytes are aligned on the max of the alignment
+/// of all the data that was written by `AlignedWriter`.
+pub struct AlignedReader<'bytes> {
+    /// Remaining bytes to be read
+    bytes: &'bytes mut [u8],
+
+    /// Expected alignment of the input data
+    #[cfg(debug_assertions)]
+    input_alignment: usize,
+}
+
+impl<'bytes> AlignedReader<'bytes> {
+    /// Prepare some bytes for alignment-aware readout
+    ///
+    /// In debug builds, `AlignedReader` will check that the input bytes were
+    /// sufficiently well-aligned for the data that is being read from it, as
+    /// per the `input_alignment` parameter to this function.
+    //
+    // FIXME: input_alignment should be #[cfg(debug_assertions)], but at the
+    //        moment Rust 1.39 is a bit too freshly released to rely on that.
+    #[allow(unused)]
+    pub fn new(bytes: &'bytes mut [u8], input_alignment: usize) -> Self {
+        debug_assert_eq!((bytes.as_ptr() as usize) % input_alignment, 0,
+                         "Input data is not aligned on a {}-byte boundary as expected",
+                         input_alignment);
+        Self {
+            bytes,
+            #[cfg(debug_assertions)] input_alignment,
+        }
+    }
+
+    /// Read a slice of data of arbitrary type from the inner bytes, returns a
+    /// pointer to the first element of the slice, or None if the request
+    /// overflows the input bytes.
+    //
+    // FIXME: This should return a NonNull<[T]>, but pointers to slices are not
+    //        ergonomic enough at this point in time.
+    pub fn read_slice<T>(&mut self, len: usize) -> Option<NonNull<T>> {
+        // As far as I know, zero-length slices may be aligned differently but
+        // all nonzero-length slices are aligned identically
+        let alignment = if len == 0 {
+            mem::align_of::<[T; 0]>()
+        } else {
+            mem::align_of::<[T; 1]>()
+        };
+
+        // In debug builds, check that the input allocation has sufficiently
+        // strong alignment for the data that's being read from it.
+        //
+        // If the input alignment is too low, readout may go wrong because the
+        // AlignedReader will skip a number of padding bytes that may not be
+        // in sync with the amount that AlignedWriter has inserted, in a manner
+        // that depends on how the data being read out was _actually_ aligned.
+        #[cfg(debug_assertions)]
+        debug_assert!(
+            alignment <= self.input_alignment,
+            "Insufficient input alignment (input alignment is {}, asked for data of alignment {})",
+            self.input_alignment, alignment
+        );
+
+        // Drop the alignment padding bytes leading up to the inner T-typed data
+        let misalignment = self.bytes.as_ptr() as usize % alignment;
+        if misalignment != 0 {
+            let offset = alignment - misalignment;
+            if offset > self.bytes.len() { return None; }
+            // In an ideal world, one could just write:
+            //     self.bytes = &mut self.bytes[offset..]
+            // Alas, in this world, we need...
+            self.bytes = unsafe {
+                mem::transmute::<&mut [u8], &'bytes mut [u8]>(&mut self.bytes[offset..])
+            };
+        }
+
+        // Make sure that we still have enough bytes for readout
+        let size = mem::size_of::<T>() * len;
+        if size > self.bytes.len() { return None; }
+
+        // Extract the inner T-typed data
+        // This is safe because we checked that the input size is large enough
+        // and the first pointer of a slice cannot be null
+        let (out, rest) = self.bytes.split_at_mut(size);
+        let result: NonNull<T> = unsafe {
+            NonNull::new_unchecked(out.as_mut_ptr() as *mut T)
+        };
+
+        // Update the inner slice. In an ideal world, one could just write
+        //     self.bytes = rest
+        // Alas, in this world, we need...
+        self.bytes = unsafe {
+            mem::transmute::<&mut [u8], &'bytes mut [u8]>(rest)
+        };
+        Some(result)
+    }
+
+    /// Read arbitrary data from the inner bytes
+    pub fn read<T>(&mut self) -> Option<NonNull<T>> {
+        self.read_slice(1)
+    }
+
+    /// Extract the remaining bytes
+    pub fn remaining(self) -> &'bytes mut [u8] {
+        self.bytes
+    }
+}
+
+
+#[cfg(test)]
+mod tests {
+    use super::{AlignedReader, AlignedWriter};
+
+    #[test]
+    fn round_trip() {
+        // We'll write the following binary data down
+        let u1 = 0x42u8;
+        let u2 = 0x12345678_9abcdef0_u64;
+        let u3s = [0x13579bdf_u32, 0x2468ace0_u32];
+        type UMax = u64;
+        let max_align = std::mem::align_of::<UMax>();
+
+        // Build a writer for it
+        let mut bytes = Vec::new();
+        let mut writer = AlignedWriter::new(&mut bytes, max_align);
+
+        // Write it down
+        unsafe {
+            writer.write(&u1).unwrap();
+            writer.write(&u2).unwrap();
+            writer.write_slice(&u3s[..]).unwrap();
+        }
+
+        // Check written bytes counter
+        let written = writer.written_so_far();
+        std::mem::drop(writer);
+        assert_eq!(written, bytes.len(),
+                   "Number of reported written bytes is wrong");
+        assert_eq!(written, 1 + 7 + 8 + 4 + 4,
+                   "Reported written bytes does not match written data");
+
+        // Check written data
+        assert_eq!(bytes[0], u1,
+                   "8-bit number was written wrong");
+        assert_eq!(bytes[1..8], [0, 0, 0, 0, 0, 0, 0],
+                   "Padding for 64-bit number was written wrong");
+        assert_eq!(bytes[8..16], u2.to_ne_bytes(),
+                   "64-bit number was written wrong");
+        assert_eq!(bytes[16..20], u3s[0].to_ne_bytes(),
+                   "First 32-bit number was written wrong");
+        assert_eq!(bytes[20..24], u3s[1].to_ne_bytes(),
+                   "Second 32-bit number was written wrong");
+
+        // Prepare to read back the data
+        let mut reader = AlignedReader::new(&mut bytes, max_align);
+
+        // Read back the data
+        unsafe {
+            assert_eq!(reader.read::<u8>().unwrap().as_ref(), &u1,
+                       "8-bit number was read wrong");
+            assert_eq!(reader.read::<u64>().unwrap().as_ref(), &u2,
+                       "64-bit number was read wrong");
+            let slice_ptr = reader.read_slice::<u32>(u3s.len()).unwrap();
+            let slice = std::slice::from_raw_parts(slice_ptr.as_ptr(),
+                                                   u3s.len());
+            assert_eq!(slice, &u3s,
+                       "32-bit numbers were read wrong");
+        }
+
+        // Make sure that we consumed all the bytes
+        assert_eq!(reader.remaining(), &[],
+                   "No bytes should remain");
+    }
+}
diff --git a/src/align/mod.rs b/src/align/mod.rs
new file mode 100644
index 0000000..eff9c4f
--- /dev/null
+++ b/src/align/mod.rs
@@ -0,0 +1,9 @@
+/// Utilities for handling alignment in abomonated data
+
+mod io;
+mod alloc;
+
+#[deprecated(note = "Made pub for internal unsafe_abomonate use only")]
+pub use self::io::{AlignedReader, AlignedWriter};
+
+pub use self::alloc::{AlignedBytes, Coffin};
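The padding rule that `AlignedWriter` and `AlignedReader` must agree on is the usual C-struct one: round the running offset up to the next multiple of the field's alignment. As a standalone illustration (the `pad_to_align` helper is hypothetical, not part of this diff):

```rust
// Round `offset` up to the next multiple of `align` (a power of two),
// which is the number of bytes AlignedWriter will have emitted once
// its padding loop completes.
fn pad_to_align(offset: usize, align: usize) -> usize {
    debug_assert!(align.is_power_of_two());
    (offset + align - 1) & !(align - 1)
}

fn main() {
    // One u8 followed by a u64 requires 7 padding bytes in between,
    // matching the `1 + 7 + 8 + 4 + 4` layout in the round_trip test above
    assert_eq!(pad_to_align(1, 8), 8);
    // Two u32s following a u64 need no padding at all
    assert_eq!(pad_to_align(16, 4), 16);
}
```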
diff --git a/src/lib.rs b/src/lib.rs
index 2e617dc..e5a6485 100644
--- a/src/lib.rs
+++ b/src/lib.rs
@@ -35,21 +35,33 @@
 //! }
 //! ```
 
-use std::mem; // yup, used pretty much everywhere.
+use std::mem;
 use std::io::Write; // for bytes.write_all; push_all is unstable and extend is slow.
 use std::io::Result as IOResult;
 use std::marker::PhantomData;
 use std::num::*;
+use std::ptr::NonNull;
 
 pub mod abomonated;
+pub mod align;
+
+#[deprecated(note = "Made pub for internal unsafe_abomonate use only")]
+pub use align::{AlignedReader, AlignedWriter};
 
 /// Encodes a typed reference into a binary buffer.
 ///
 /// # Safety
 ///
-/// This method is unsafe because it is unsafe to transmute typed allocations to binary.
-/// Furthermore, Rust currently indicates that it is undefined behavior to observe padding
-/// bytes, which will happen when we `memcpy` structs which contain padding bytes.
+/// This method is unsafe because Rust currently specifies that it is undefined
+/// behavior to construct an `&[u8]` to padding bytes, which will happen when we
+/// write down binary data of a type T which contains padding bytes, as we must
+/// pass down an `&[u8]` to the `Write` API.
+///
+/// Eliminating this UB will require changes to the Rust language or `std` to
+/// add either (1) a non-UB way to turn padding bytes into `&[u8]` or (2) a way
+/// to send an `&[MaybeUninit<u8>]` (which allows padding bytes) to a `Write`
+/// implementation. See the following discussion thread for more info:
+/// https://internals.rust-lang.org/t/writing-down-binary-data-with-padding-bytes/11197/
 ///
 /// # Examples
 /// ```
@@ -70,12 +82,11 @@ pub mod abomonated;
 /// }
 /// ```
 ///
-#[inline]
-pub unsafe fn encode<T: Abomonation, W: Write>(typed: &T, write: &mut W) -> IOResult<()> {
-    let slice = std::slice::from_raw_parts(mem::transmute(typed), mem::size_of::<T>());
-    write.write_all(slice)?;
-    typed.entomb(write)?;
-    Ok(())
+#[inline(always)]
+pub unsafe fn encode<T: Entomb, W: Write>(typed: &T, write: W) -> IOResult<()> {
+    let mut writer = AlignedWriter::new(write, T::alignment());
+    writer.write::<T>(typed)?;
+    T::entomb(typed, &mut writer)
 }
 
 /// Decodes a mutable binary slice into an immutable typed reference.
 ///
@@ -87,19 +98,30 @@ pub unsafe fn encode<T: Abomonation, W: Write>(typed: &T, write: &mut W) -> IORe
 ///
 /// # Safety
 ///
-/// The `decode` method is unsafe due to a number of unchecked invariants.
+/// ## Data validity
+///
+/// `decode()` does not check that the input bytes uphold T's validity
+/// invariants. Decoding arbitrary `&[u8]` data can result in invalid
+/// utf8 strings, enums with invalid discriminants, null references, etc., and
+/// some forms of broken invariants are undefined behavior in Rust.
+///
+/// `decode` *does* perform bounds checks, as part of determining if enough data
+/// are present to completely decode, so it should only read and write within
+/// the bounds of its `&mut [u8]` argument. But that only prevents UB for
+/// truncated data, not arbitrary invalid data.
 ///
-/// Decoding arbitrary `&[u8]` data can
-/// result in invalid utf8 strings, enums with invalid discriminants, etc. `decode` *does*
-/// perform bounds checks, as part of determining if enough data are present to completely decode,
-/// and while it should only write within the bounds of its `&mut [u8]` argument, the use of invalid
-/// utf8 and enums are undefined behavior.
+/// Therefore, please do not decode data that was not encoded by the
+/// corresponding encode() implementation.
 ///
-/// Please do not decode data that was not encoded by the corresponding implementation.
+/// ## Alignment
 ///
-/// In addition, `decode` does not ensure that the bytes representing types will be correctly aligned.
-/// On several platforms unaligned reads are undefined behavior, but on several other platforms they
-/// are only a performance penalty.
+/// `decode()` assumes that the input bytes follow the alignment requirements of
+/// abomonated data of type T, which you can check with `T::alignment()`.
+/// Failure to meet this requirement will result in undefined behavior.
+///
+/// If you are not able to guarantee sufficient alignment from your data source, you may find the
+/// `align::AlignedBytes` utility useful. It checks if your data is well-aligned, and moves it
+/// into a well-aligned heap allocation otherwise.
 ///
 /// # Examples
 /// ```
@@ -119,19 +141,12 @@ pub unsafe fn encode<T: Abomonation, W: Write>(typed: &T, write: &mut W) -> IORe
 /// assert!(remaining.len() == 0);
 /// }
 /// ```
-#[inline]
-pub unsafe fn decode<T: Abomonation>(bytes: &mut [u8]) -> Option<(&T, &mut [u8])> {
-    if bytes.len() < mem::size_of::<T>() { None }
-    else {
-        let (split1, split2) = bytes.split_at_mut(mem::size_of::<T>());
-        let result: &mut T = mem::transmute(split1.get_unchecked_mut(0));
-        if let Some(remaining) = result.exhume(split2) {
-            Some((result, remaining))
-        }
-        else {
-            None
-        }
-    }
+pub unsafe fn decode<'bytes, T>(bytes: &'bytes mut [u8]) -> Option<(&'bytes T, &'bytes mut [u8])>
+    where T: Exhume<'bytes>
+{
+    let mut reader = AlignedReader::new(bytes, T::alignment());
+    let result_ptr = reader.read::<T>()?;
+    Some((T::exhume(result_ptr, &mut reader)?, reader.remaining()))
 }
 
 /// Reports the number of bytes required to encode `self`.
 ///
@@ -139,39 +154,106 @@ pub unsafe fn decode<T: Abomonation>(bytes: &mut [u8]) -> Option<(&T, &mut [u8])
 /// # Safety
 ///
 /// The `measure` method is safe. It neither produces nor consults serialized representations.
-#[inline]
-pub fn measure<T: Abomonation>(typed: &T) -> usize {
-    mem::size_of::<T>() + typed.extent()
+pub fn measure<T: Entomb>(typed: &T) -> usize {
+    let mut aligned_sink = AlignedWriter::new(std::io::sink(), T::alignment());
+    unsafe { encode(typed, &mut aligned_sink).expect("Sink should be infallible"); }
+    aligned_sink.written_so_far()
 }
 
 /// Abomonation provides methods to serialize any heap data the implementor owns.
 ///
+/// The trait's lifetime parameter `'de` represents the set of slices of bytes `&'de mut [u8]`
+/// from which it is valid to deserialize an `&'de impl Abomonation<'de>`. Types which own all of
+/// their data may be deserialized freely, and implement this trait for all `'de`. However, we
+/// need to enforce some deserialization restrictions on types which contain references.
+///
+/// The reason is that abomonation performs in-place deserialization. To do that, it has to
+/// patch a type's reference to point to other serialized data. Where a type _should_ contain an
+/// `&'a T`, abomonation patches that into an `&'de T`. For this substitution to be valid, we
+/// need `'de` to outlive `'a`. Otherwise, a careless user could ask abomonation to deserialize a
+/// `&'static T` and get a `&'de T` which masquerades as an `&'static T` instead. The user could
+/// then copy this reference, drop the bytes, and get use-after-free undefined behavior.
+///
 /// The default implementations for Abomonation's methods are all empty. Many types have no owned
 /// data to transcribe. Some do, however, and need to carefully implement these unsafe methods.
 ///
 /// # Safety
 ///
-/// Abomonation has no safe methods. Please do not call them. They should be called only by
+/// `entomb` and `exhume` are not meant to be called directly. They should be called only by
 /// `encode` and `decode`, each of which imposes restrictions on ownership and lifetime of the data
-/// they take as input and return as output.
+/// they take as input and return as output, thus improving safety.
+///
+/// Not all Rust types are abomonable, and one should think carefully about the implications of
+/// implementing `Abomonation` for a type. To lend itself to this exercise, a type must...
+///
+/// - Provide exhaustive access to its internal representation
+/// - Allow reconstruction from said representation
+/// - Survive having its heap allocations silently replaced by inline pointers to
+///   the same storage block, as long as only a shared reference is observed.
+///
+/// The last point is the reason why `Abomonation` only provides a shared reference to the
+/// reconstructed object. Without this, it would be trivial to trigger, say, a `Box` destructor
+/// that tries to call `free()` on the inner pointer. But the use of a shared reference only
+/// provides minimal sanity, and for types with internal mutability (those with an `UnsafeCell`
+/// inside), this precaution is insufficient. `Abomonation` is generally not safely implementable
+/// for such types, but may work in particular cases like atomics.
 ///
 /// If you are concerned about safety, it may be best to avoid Abomonation altogether. It does
 /// several things that may be undefined behavior, depending on how undefined behavior is defined.
-pub trait Abomonation {
+pub unsafe trait Abomonation<'de> : Entomb + Exhume<'de> {}
+unsafe impl<'de, T: Entomb + Exhume<'de>> Abomonation<'de> for T {}
 
+/// Types which can be serialized into bytes by abomonation
+///
+/// Please consult the Abomonation trait's documentation for more details. Most
+/// types which are serializable by abomonation are also deserializable by
+/// abomonation, but we need to have a separate serialization and
+/// deserialization trait for obscure lifetime-related reasons.
+///
+pub unsafe trait Entomb {
     /// Write any additional information about `&self` beyond its binary representation.
     ///
     /// Most commonly this is owned data on the other end of pointers in `&self`. The return value
    /// reports any failures in writing to `write`.
-    #[inline(always)] unsafe fn entomb<W: Write>(&self, _write: &mut W) -> IOResult<()> { Ok(()) }
+    unsafe fn entomb<W: Write>(&self, _write: &mut AlignedWriter<W>) -> IOResult<()> { Ok(()) }
+
+    /// Report the alignment of the complete Abomonation-serialized data
+    fn alignment() -> usize
+        where Self: Sized
+    { mem::align_of::<Self>() }
 
-    /// Recover any information for `&mut self` not evident from its binary representation.
+    /// Version of "alignment" that takes a &self parameter for use in
+    /// declarative macros.
     ///
-    /// Most commonly this populates pointers with valid references into `bytes`.
-    #[inline(always)] unsafe fn exhume<'a,'b>(&'a mut self, bytes: &'b mut [u8]) -> Option<&'b mut [u8]> { Some(bytes) }
+    /// This is _not_ analogous to `mem::align_of_val` and is only intended for
+    /// the internal consumption of the deprecated `unsafe_abomonate` macro.
+    /// Please do not use this trait method in any other code.
+    ///
+    #[deprecated(note="For internal use of unsafe_abomonate only")]
+    fn alignment_from_self_ref(&self) -> usize
+        where Self: Sized
+    { Self::alignment() }
+}
 
-    /// Reports the number of further bytes required to entomb `self`.
-    #[inline(always)] fn extent(&self) -> usize { 0 }
+/// Types which can be deserialized from `&'de mut [u8]` to `&'de T` by abomonation
+///
+/// Please consult the Abomonation trait's documentation for more details. Most
+/// types which are serializable by abomonation are also deserializable by
+/// abomonation, but we need to have a separate serialization and
+/// deserialization trait for obscure lifetime-related reasons.
+///
+pub unsafe trait Exhume<'de> : Entomb + 'de {
+    /// Recover any information for `self_` not evident from its binary representation.
+    ///
+    /// Most commonly this populates pointers with valid references into `bytes`.
+    ///
+    /// Implementors should take note that `self_` is initially in an invalid state, as its inner
+    /// pointers may be dangling. As Rust references come with a data validity invariant, building
+    /// references to invalid state is undefined behavior, so one should strive to implement
+    /// `exhume` using raw pointer operations as much as feasible.
+    //
+    // FIXME: Replace self_ with self once Rust has arbitrary self types
+    unsafe fn exhume(self_: NonNull<Self>, _reader: &mut AlignedReader<'de>) -> Option<&'de mut Self> { Some(&mut *self_.as_ptr()) }
 }
 
 /// The `unsafe_abomonate!` macro takes a type name with an optional list of fields, and implements
@@ -219,22 +301,38 @@ pub trait Abomonation {
 #[deprecated(since="0.5", note="please use the abomonation_derive crate")]
 macro_rules! unsafe_abomonate {
     ($t:ty) => {
-        impl Abomonation for $t { }
+        unsafe impl $crate::Entomb for $t { }
+        unsafe impl $crate::Exhume<'_> for $t { }
     };
     ($t:ty : $($field:ident),*) => {
-        impl Abomonation for $t {
-            #[inline] unsafe fn entomb<W: ::std::io::Write>(&self, write: &mut W) -> ::std::io::Result<()> {
-                $( self.$field.entomb(write)?; )*
+        unsafe impl $crate::Entomb for $t {
+            #[allow(deprecated)]
+            unsafe fn entomb<W: ::std::io::Write>(&self, write: &mut $crate::AlignedWriter<W>) -> ::std::io::Result<()> {
+                $( $crate::Entomb::entomb(&self.$field, write)?; )*
                 Ok(())
             }
-            #[inline] unsafe fn exhume<'a,'b>(&'a mut self, mut bytes: &'b mut [u8]) -> Option<&'b mut [u8]> {
-                $( let temp = bytes; bytes = self.$field.exhume(temp)?; )*
-                Some(bytes)
+
+            #[allow(deprecated)]
+            fn alignment() -> usize {
+                // This is ugly, but I can't think about a better way to do this
+                // in a declarative macro-based code generator...
+                let bad_ref: &Self = unsafe { &*::std::ptr::NonNull::<Self>::dangling().as_ptr() };
+                let mut align = ::std::mem::align_of::<Self>();
+                $( align = align.max(bad_ref.$field.alignment_from_self_ref()); )*
+                align
             }
-            #[inline] fn extent(&self) -> usize {
-                let mut size = 0;
-                $( size += self.$field.extent(); )*
-                size
+        }
+
+        unsafe impl<'de> $crate::Exhume<'de> for $t {
+            #[allow(deprecated)]
+            unsafe fn exhume(self_: ::std::ptr::NonNull<Self>, reader: &mut $crate::AlignedReader<'de>) -> Option<&'de mut Self> {
+                $(
+                    // FIXME: This (briefly) constructs an &mut _ to invalid data, which is UB.
+                    //        The proposed &raw mut operator would allow avoiding this.
+                    let field_ptr: ::std::ptr::NonNull<_> = From::from(&mut (*self_.as_ptr()).$field);
+                    $crate::Exhume::exhume(field_ptr, reader)?;
+                )*
+                Some(&mut *self_.as_ptr())
            }
        }
    };
}
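Usage of the (deprecated) macro is unchanged by this diff; a minimal sketch with a hypothetical `MyStruct`, in the style of the crate docs:

```rust
#[macro_use]
extern crate abomonation;
use abomonation::{encode, decode};

#[derive(Eq, PartialEq, Debug)]
struct MyStruct {
    a: String,
    b: u64,
    c: Vec<u8>,
}

// Synthesizes Entomb and Exhume impls from the listed fields
unsafe_abomonate!(MyStruct : a, b, c);

fn main() {
    let record = MyStruct { a: "test".to_string(), b: 0, c: vec![0, 1, 2] };

    let mut bytes = Vec::new();
    unsafe { encode(&record, &mut bytes).unwrap(); }

    if let Some((result, remaining)) = unsafe { decode::<MyStruct>(&mut bytes) } {
        assert_eq!(result, &record);
        assert!(remaining.is_empty());
    }
}
```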
tuple_abomonate { - ( $($name:ident)+) => ( - impl<$($name: Abomonation),*> Abomonation for ($($name,)*) { + ( $($ty:ident)+) => ( + unsafe impl<$($ty: Entomb),*> Entomb for ($($ty,)*) { #[allow(non_snake_case)] - #[inline(always)] unsafe fn entomb(&self, write: &mut WRITE) -> IOResult<()> { - let ($(ref $name,)*) = *self; - $($name.entomb(write)?;)* + unsafe fn entomb(&self, write: &mut AlignedWriter) -> IOResult<()> { + let ($(ref $ty,)*) = *self; + $( $ty::entomb($ty, write)?; )* Ok(()) } + #[allow(non_snake_case)] - #[inline(always)] unsafe fn exhume<'a,'b>(&'a mut self, mut bytes: &'b mut [u8]) -> Option<&'b mut [u8]> { - let ($(ref mut $name,)*) = *self; - $( let temp = bytes; bytes = $name.exhume(temp)?; )* - Some(bytes) + fn alignment() -> usize { + let mut align = mem::align_of::(); + $( align = align.max($ty::alignment()); )* + align } + } + + unsafe impl<'de, $($ty: Exhume<'de>),*> Exhume<'de> for ($($ty,)*) { #[allow(non_snake_case)] - #[inline(always)] fn extent(&self) -> usize { - let mut size = 0; - let ($(ref $name,)*) = *self; - $( size += $name.extent(); )* - size + unsafe fn exhume(self_: NonNull, reader: &mut AlignedReader<'de>) -> Option<&'de mut Self> { + // FIXME: This (briefly) constructs a "ref mut" to invalid data, which is UB. + // I think avoiding this would require a cleaner way to iterate over tuple fields. + // One possibility would be a C++11-style combination of variadic generics and recursion. + let ($(ref mut $ty,)*) = *self_.as_ptr(); + $( + let field_ptr : NonNull<$ty> = From::from($ty); + $ty::exhume(field_ptr, reader)?; + )* + Some(&mut *self_.as_ptr()) } } ); } -impl Abomonation for u8 { } -impl Abomonation for u16 { } -impl Abomonation for u32 { } -impl Abomonation for u64 { } -impl Abomonation for u128 { } -impl Abomonation for usize { } - -impl Abomonation for i8 { } -impl Abomonation for i16 { } -impl Abomonation for i32 { } -impl Abomonation for i64 { } -impl Abomonation for i128 { } -impl Abomonation for isize { } - -impl Abomonation for NonZeroU8 { } -impl Abomonation for NonZeroU16 { } -impl Abomonation for NonZeroU32 { } -impl Abomonation for NonZeroU64 { } -impl Abomonation for NonZeroU128 { } -impl Abomonation for NonZeroUsize { } - -impl Abomonation for NonZeroI8 { } -impl Abomonation for NonZeroI16 { } -impl Abomonation for NonZeroI32 { } -impl Abomonation for NonZeroI64 { } -impl Abomonation for NonZeroI128 { } -impl Abomonation for NonZeroIsize { } - -impl Abomonation for f32 { } -impl Abomonation for f64 { } - -impl Abomonation for bool { } -impl Abomonation for () { } - -impl Abomonation for char { } - -impl Abomonation for ::std::time::Duration { } - -impl Abomonation for PhantomData {} - -impl Abomonation for Option { - #[inline(always)] unsafe fn entomb(&self, write: &mut W) -> IOResult<()> { +unsafe impl Entomb for u8 {} +unsafe impl Exhume<'_> for u8 {} +unsafe impl Entomb for u16 {} +unsafe impl Exhume<'_> for u16 {} +unsafe impl Entomb for u32 {} +unsafe impl Exhume<'_> for u32 {} +unsafe impl Entomb for u64 {} +unsafe impl Exhume<'_> for u64 {} +unsafe impl Entomb for u128 {} +unsafe impl Exhume<'_> for u128 {} +unsafe impl Entomb for usize {} +unsafe impl Exhume<'_> for usize {} + +unsafe impl Entomb for i8 {} +unsafe impl Exhume<'_> for i8 {} +unsafe impl Entomb for i16 {} +unsafe impl Exhume<'_> for i16 {} +unsafe impl Entomb for i32 {} +unsafe impl Exhume<'_> for i32 {} +unsafe impl Entomb for i64 {} +unsafe impl Exhume<'_> for i64 {} +unsafe impl Entomb for i128 {} +unsafe impl Exhume<'_> for i128 {} +unsafe impl Entomb 
for isize {} +unsafe impl Exhume<'_> for isize {} + +unsafe impl Entomb for NonZeroU8 {} +unsafe impl Exhume<'_> for NonZeroU8 {} +unsafe impl Entomb for NonZeroU16 {} +unsafe impl Exhume<'_> for NonZeroU16 {} +unsafe impl Entomb for NonZeroU32 {} +unsafe impl Exhume<'_> for NonZeroU32 {} +unsafe impl Entomb for NonZeroU64 {} +unsafe impl Exhume<'_> for NonZeroU64 {} +unsafe impl Entomb for NonZeroU128 {} +unsafe impl Exhume<'_> for NonZeroU128 {} +unsafe impl Entomb for NonZeroUsize {} +unsafe impl Exhume<'_> for NonZeroUsize {} + +unsafe impl Entomb for NonZeroI8 {} +unsafe impl Exhume<'_> for NonZeroI8 {} +unsafe impl Entomb for NonZeroI16 {} +unsafe impl Exhume<'_> for NonZeroI16 {} +unsafe impl Entomb for NonZeroI32 {} +unsafe impl Exhume<'_> for NonZeroI32 {} +unsafe impl Entomb for NonZeroI64 {} +unsafe impl Exhume<'_> for NonZeroI64 {} +unsafe impl Entomb for NonZeroI128 {} +unsafe impl Exhume<'_> for NonZeroI128 {} +unsafe impl Entomb for NonZeroIsize {} +unsafe impl Exhume<'_> for NonZeroIsize {} + +unsafe impl Entomb for f32 {} +unsafe impl Exhume<'_> for f32 {} +unsafe impl Entomb for f64 {} +unsafe impl Exhume<'_> for f64 {} + +unsafe impl Entomb for bool {} +unsafe impl Exhume<'_> for bool {} +unsafe impl Entomb for () {} +unsafe impl Exhume<'_> for () {} + +unsafe impl Entomb for char {} +unsafe impl Exhume<'_> for char {} +unsafe impl Entomb for str { fn alignment() -> usize { mem::align_of::<[u8; 1]>() } } +unsafe impl Exhume<'_> for str {} + +unsafe impl Entomb for ::std::time::Duration {} +unsafe impl Exhume<'_> for ::std::time::Duration {} + +unsafe impl Entomb for PhantomData {} +unsafe impl<'de, T: 'de> Exhume<'de> for PhantomData {} + +unsafe impl Entomb for Option { + unsafe fn entomb(&self, write: &mut AlignedWriter) -> IOResult<()> { if let &Some(ref inner) = self { - inner.entomb(write)?; + T::entomb(inner, write)?; } Ok(()) } - #[inline(always)] unsafe fn exhume<'a, 'b>(&'a mut self, mut bytes: &'b mut[u8]) -> Option<&'b mut [u8]> { - if let &mut Some(ref mut inner) = self { - let tmp = bytes; bytes = inner.exhume(tmp)?; - } - Some(bytes) + + fn alignment() -> usize { + mem::align_of::().max(T::alignment()) } - #[inline] fn extent(&self) -> usize { - self.as_ref().map(|inner| inner.extent()).unwrap_or(0) +} +unsafe impl<'de, T: Exhume<'de>> Exhume<'de> for Option { + unsafe fn exhume(self_: NonNull, reader: &mut AlignedReader<'de>) -> Option<&'de mut Self> { + // FIXME: This (briefly) constructs a "ref mut" to invalid data, which is UB. + // I'm not sure if this can be fully resolved without relying on enum implementation details. 
+ if let Some(ref mut inner) = *self_.as_ptr() { + let inner_ptr : NonNull = From::from(inner); + T::exhume(inner_ptr, reader)?; + } + Some(&mut *self_.as_ptr()) } } -impl Abomonation for Result { - #[inline(always)] unsafe fn entomb(&self, write: &mut W) -> IOResult<()> { - match self { - &Ok(ref inner) => inner.entomb(write)?, - &Err(ref inner) => inner.entomb(write)?, - }; - Ok(()) - } - #[inline(always)] unsafe fn exhume<'a, 'b>(&'a mut self, bytes: &'b mut[u8]) -> Option<&'b mut [u8]> { +unsafe impl Entomb for Result { + unsafe fn entomb(&self, write: &mut AlignedWriter) -> IOResult<()> { match self { - &mut Ok(ref mut inner) => inner.exhume(bytes), - &mut Err(ref mut inner) => inner.exhume(bytes), + &Ok(ref inner) => T::entomb(inner, write), + &Err(ref inner) => E::entomb(inner, write), } } - #[inline] fn extent(&self) -> usize { - match self { - &Ok(ref inner) => inner.extent(), - &Err(ref inner) => inner.extent(), + + fn alignment() -> usize { + mem::align_of::().max(T::alignment()).max(E::alignment()) + } +} +unsafe impl<'de, T: Exhume<'de>, E: Exhume<'de>> Exhume<'de> for Result { + unsafe fn exhume(self_: NonNull, reader: &mut AlignedReader<'de>) -> Option<&'de mut Self> { + // FIXME: This (briefly) constructs a "ref mut" to invalid data, which is UB. + // I'm not sure if this can be fully resolved without relying on enum implementation details. + match *self_.as_ptr() { + Ok(ref mut inner) => { + let inner_ptr : NonNull = From::from(inner); + T::exhume(inner_ptr, reader)?; + } + Err(ref mut inner) => { + let inner_ptr : NonNull = From::from(inner); + E::exhume(inner_ptr, reader)?; + } } + Some(&mut *self_.as_ptr()) } } @@ -380,28 +534,41 @@ tuple_abomonate!(A B C D E F G H I J K L M N O P Q R S T U V W X Y Z AA AB AC AD tuple_abomonate!(A B C D E F G H I J K L M N O P Q R S T U V W X Y Z AA AB AC AD AE); tuple_abomonate!(A B C D E F G H I J K L M N O P Q R S T U V W X Y Z AA AB AC AD AE AF); +unsafe impl Entomb for [T] { + unsafe fn entomb(&self, write: &mut AlignedWriter) -> IOResult<()> { + for element in self { T::entomb(element, write)?; } + Ok(()) + } + + fn alignment() -> usize { + <[T; 1]>::alignment() + } +} +unsafe impl<'de, T: Exhume<'de>> Exhume<'de> for [T] { + unsafe fn exhume(self_: NonNull, reader: &mut AlignedReader<'de>) -> Option<&'de mut Self> { + // FIXME: This constructs an &[T] to invalid data, which is UB. + // I'm not sure if this can be fully resolved without relying on slice implementation details. + let self_len = self_.as_ref().len(); + exhume_slice(self_.as_ptr() as *mut T, self_len, reader) + } +} macro_rules! 
array_abomonate { ($size:expr) => ( - impl Abomonation for [T; $size] { - #[inline(always)] - unsafe fn entomb(&self, write: &mut W) -> IOResult<()> { - for element in self { element.entomb(write)?; } - Ok(()) + unsafe impl Entomb for [T; $size] { + unsafe fn entomb(&self, write: &mut AlignedWriter) -> IOResult<()> { + <[T]>::entomb(&self[..], write) } - #[inline(always)] - unsafe fn exhume<'a, 'b>(&'a mut self, mut bytes: &'b mut[u8]) -> Option<&'b mut [u8]> { - for element in self { - let tmp = bytes; bytes = element.exhume(tmp)?; - } - Some(bytes) + + fn alignment() -> usize { + mem::align_of::().max(T::alignment()) } - #[inline(always)] fn extent(&self) -> usize { - let mut size = 0; - for element in self { - size += element.extent(); - } - size + } + + unsafe impl<'de, T: Exhume<'de>> Exhume<'de> for [T; $size] { + unsafe fn exhume(self_: NonNull, reader: &mut AlignedReader<'de>) -> Option<&'de mut Self> { + exhume_slice(self_.as_ptr() as *mut T, $size, reader)?; + Some(&mut *self_.as_ptr()) } } ) @@ -441,97 +608,251 @@ array_abomonate!(30); array_abomonate!(31); array_abomonate!(32); -impl Abomonation for String { - #[inline] - unsafe fn entomb(&self, write: &mut W) -> IOResult<()> { - write.write_all(self.as_bytes())?; - Ok(()) +unsafe impl<'de> Entomb for &'de str { + unsafe fn entomb(&self, writer: &mut AlignedWriter) -> IOResult<()> { + writer.write_slice(self.as_bytes()) } - #[inline] - unsafe fn exhume<'a,'b>(&'a mut self, bytes: &'b mut [u8]) -> Option<&'b mut [u8]> { - if self.len() > bytes.len() { None } - else { - let (mine, rest) = bytes.split_at_mut(self.len()); - std::ptr::write(self, String::from_raw_parts(mem::transmute(mine.as_ptr()), self.len(), self.len())); - Some(rest) - } + + fn alignment() -> usize { + mem::align_of::().max(<[u8; 1]>::alignment()) } - #[inline] fn extent(&self) -> usize { - self.len() +} +unsafe impl<'de> Exhume<'de> for &'de str { + #[inline] + unsafe fn exhume(self_: NonNull, reader: &mut AlignedReader<'de>) -> Option<&'de mut Self> { + // FIXME: This (briefly) constructs an &str to invalid data, which is UB. + // I'm not sure if this can be fully resolved without relying on &str implementation details. + let self_len = self_.as_ref().len(); + let s = exhume_str_ref(self_len, reader)?; + self_.as_ptr().write(s); + Some(&mut *self_.as_ptr()) } } -impl Abomonation for Vec { +unsafe impl<'de> Entomb for &'de mut str { + unsafe fn entomb(&self, write: &mut AlignedWriter) -> IOResult<()> { + <&str>::entomb(&self.as_ref(), write) + } + + fn alignment() -> usize { + <&str>::alignment() + } +} +unsafe impl<'de> Exhume<'de> for &'de mut str { #[inline] - unsafe fn entomb(&self, write: &mut W) -> IOResult<()> { - write.write_all(typed_to_bytes(&self[..]))?; - for element in self.iter() { element.entomb(write)?; } - Ok(()) + unsafe fn exhume(self_: NonNull, reader: &mut AlignedReader<'de>) -> Option<&'de mut Self> { + // FIXME: This (briefly) constructs an &mut str to invalid data, which is UB. + // I'm not sure if this can be fully resolved without relying on &str implementation details. 
+        let self_len = self_.as_ref().len();
+        let s = exhume_str_ref(self_len, reader)?;
+        self_.as_ptr().write(s);
+        Some(&mut *self_.as_ptr())
+    }
+}
+
+unsafe impl Entomb for String {
+    unsafe fn entomb<W: Write>(&self, write: &mut AlignedWriter<W>) -> IOResult<()> {
+        <&str>::entomb(&self.as_ref(), write)
     }
+
+    fn alignment() -> usize {
+        mem::align_of::<Self>().max(<[u8; 1]>::alignment())
+    }
+}
+unsafe impl<'de> Exhume<'de> for String {
     #[inline]
-    unsafe fn exhume<'a,'b>(&'a mut self, bytes: &'b mut [u8]) -> Option<&'b mut [u8]> {
-
-        // extract memory from bytes to back our vector
-        let binary_len = self.len() * mem::size_of::<T>();
-        if binary_len > bytes.len() { None }
-        else {
-            let (mine, mut rest) = bytes.split_at_mut(binary_len);
-            let slice = std::slice::from_raw_parts_mut(mine.as_mut_ptr() as *mut T, self.len());
-            std::ptr::write(self, Vec::from_raw_parts(slice.as_mut_ptr(), self.len(), self.len()));
-            for element in self.iter_mut() {
-                let temp = rest; // temp variable explains lifetimes (mysterious!)
-                rest = element.exhume(temp)?;
-            }
-            Some(rest)
-        }
+    unsafe fn exhume(self_: NonNull<Self>, reader: &mut AlignedReader<'de>) -> Option<&'de mut Self> {
+        // FIXME: This (briefly) constructs an &String to invalid data, which is UB.
+        //        I'm not sure if this can be fully resolved without relying on String implementation details.
+        let self_len = self_.as_ref().len();
+        let s = exhume_str_ref(self_len, reader)?;
+        self_.as_ptr().write(String::from_raw_parts(s.as_mut_ptr(), s.len(), s.len()));
+        Some(&mut *self_.as_ptr())
     }
+}
+
+unsafe impl<'de, T: Entomb + 'de> Entomb for &'de [T] {
+    unsafe fn entomb<W: Write>(&self, writer: &mut AlignedWriter<W>) -> IOResult<()> {
+        writer.write_slice::<T>(&self[..])?;
+        <[T]>::entomb(&self[..], writer)
+    }
+
+    fn alignment() -> usize {
+        mem::align_of::<Self>().max(<[T; 1]>::alignment())
+    }
+}
+unsafe impl<'de, T: Exhume<'de>> Exhume<'de> for &'de [T] {
     #[inline]
-    fn extent(&self) -> usize {
-        let mut sum = mem::size_of::<T>() * self.len();
-        for element in self.iter() {
-            sum += element.extent();
-        }
-        sum
+    unsafe fn exhume(self_: NonNull<Self>, bytes: &mut AlignedReader<'de>) -> Option<&'de mut Self> {
+        // FIXME: This (briefly) constructs an &[T] to invalid data, which is UB.
+        //        I'm not sure if this can be fully resolved without relying on slice implementation details.
+        let self_len = self_.as_ref().len();
+        let s = exhume_slice_ref(self_len, bytes)?;
+        self_.as_ptr().write(s);
+        Some(&mut *self_.as_ptr())
     }
 }
 
-impl<T: Abomonation> Abomonation for Box<T> {
+unsafe impl<'de, T: Entomb> Entomb for &'de mut [T] {
+    unsafe fn entomb<W: Write>(&self, write: &mut AlignedWriter<W>) -> IOResult<()> {
+        <&[T]>::entomb(&&self[..], write)
+    }
+
+    fn alignment() -> usize {
+        <&[T]>::alignment()
+    }
+}
+unsafe impl<'de, T: Exhume<'de>> Exhume<'de> for &'de mut [T] {
     #[inline]
-    unsafe fn entomb<W: Write>(&self, bytes: &mut W) -> IOResult<()> {
-        bytes.write_all(std::slice::from_raw_parts(mem::transmute(&**self), mem::size_of::<T>()))?;
-        (**self).entomb(bytes)?;
-        Ok(())
+    unsafe fn exhume(self_: NonNull<Self>, bytes: &mut AlignedReader<'de>) -> Option<&'de mut Self> {
+        // FIXME: This (briefly) constructs an &mut [T] to invalid data, which is UB.
+        //        I'm not sure if this can be fully resolved without relying on slice implementation details.
+        let self_len = self_.as_ref().len();
+        let s = exhume_slice_ref(self_len, bytes)?;
+        self_.as_ptr().write(s);
+        Some(&mut *self_.as_ptr())
+    }
+}
+
+unsafe impl<T: Entomb> Entomb for Vec<T> {
+    unsafe fn entomb<W: Write>(&self, write: &mut AlignedWriter<W>) -> IOResult<()> {
+        <&[T]>::entomb(&&self[..], write)
+    }
+
+    fn alignment() -> usize {
+        mem::align_of::<Self>().max(<[T; 1]>::alignment())
     }
+}
+unsafe impl<'de, T: Exhume<'de>> Exhume<'de> for Vec<T> {
     #[inline]
-    unsafe fn exhume<'a,'b>(&'a mut self, bytes: &'b mut [u8]) -> Option<&'b mut [u8]> {
-        let binary_len = mem::size_of::<T>();
-        if binary_len > bytes.len() { None }
-        else {
-            let (mine, mut rest) = bytes.split_at_mut(binary_len);
-            std::ptr::write(self, mem::transmute(mine.as_mut_ptr() as *mut T));
-            let temp = rest; rest = (**self).exhume(temp)?;
-            Some(rest)
-        }
+    unsafe fn exhume(self_: NonNull<Self>, bytes: &mut AlignedReader<'de>) -> Option<&'de mut Self> {
+        // FIXME: This (briefly) constructs an &Vec<T> to invalid data, which is UB.
+        //        I'm not sure if this can be fully resolved without relying on Vec implementation details.
+        let self_len = self_.as_ref().len();
+        let s = exhume_slice_ref(self_len, bytes)?;
+        self_.as_ptr().write(Vec::from_raw_parts(s.as_mut_ptr(), self_len, self_len));
+        Some(&mut *self_.as_ptr())
+    }
+}
+
+// NOTE: While it might be tempting to decouple 'de from the reference target
+//       and implement Exhume<'de> for &'target T, the two lifetimes actually
+//       have to be exactly the same. Here's a proof:
+//
+//       - Deserialization would produce an &'de &'target T. A reference is
+//         only valid if its target is longer-lived, so we need 'target: 'de.
+//       - The deserializer will silently patch &'target T into &'de T. This
+//         is only safe if &'de T is a subtype of &'target T, so we also need
+//         'de: 'target.
+//
+//       If 'target must outlive 'de and 'de must outlive 'target, then the
+//       two lifetimes must be exactly the same. Which kind of makes sense:
+//       we start from 'de bytes, and we end up producing references that
+//       point into those same bytes.
+//
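> Editor's note: the lifetime argument in the NOTE above can be checked mechanically. The sketch below (illustration only, not part of the patch; `exhume_decoupled` is a made-up name) spells out both outlives bounds on a hypothetical signature that tries to decouple the two lifetimes; together they force the compiler to unify them.

```rust
// Hypothetical sketch: attempt to decouple the deserialization lifetime 'de
// from the reference target lifetime 'target. Both bounds below are required
// by the argument above, and together they imply 'de == 'target.
fn exhume_decoupled<'de, 'target, T>(_bytes: &'de mut [u8]) -> &'de mut &'target T
where
    'target: 'de, // the produced &'de &'target T needs a longer-lived target
    'de: 'target, // the patched pointer aims into the 'de bytes themselves
{
    unimplemented!("illustration only")
}
```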
+unsafe impl<'de, T: Entomb + 'de> Entomb for &'de T {
+    unsafe fn entomb<W: Write>(&self, writer: &mut AlignedWriter<W>) -> IOResult<()> {
+        writer.write::<T>(&**self)?;
+        T::entomb(&**self, writer)
+    }
+
+    fn alignment() -> usize {
+        mem::align_of::<Self>().max(T::alignment())
+    }
+}
+unsafe impl<'de, T: Exhume<'de>> Exhume<'de> for &'de T {
+    unsafe fn exhume(self_: NonNull<Self>, reader: &mut AlignedReader<'de>) -> Option<&'de mut Self> {
+        let target = exhume_ref(reader)?;
+        self_.as_ptr().write(target);
+        Some(&mut *self_.as_ptr())
+    }
+}
+
+unsafe impl<'de, T: Entomb> Entomb for &'de mut T {
+    unsafe fn entomb<W: Write>(&self, write: &mut AlignedWriter<W>) -> IOResult<()> {
+        <&T>::entomb(&&**self, write)
+    }
+
+    fn alignment() -> usize {
+        <&T>::alignment()
+    }
+}
+unsafe impl<'de, T: Exhume<'de>> Exhume<'de> for &'de mut T {
+    unsafe fn exhume(self_: NonNull<Self>, reader: &mut AlignedReader<'de>) -> Option<&'de mut Self> {
+        let target = exhume_ref(reader)?;
+        self_.as_ptr().write(target);
+        Some(&mut *self_.as_ptr())
     }
-    #[inline] fn extent(&self) -> usize {
-        mem::size_of::<T>() + (&**self).extent()
+}
+
+unsafe impl<T: Entomb> Entomb for Box<T> {
+    unsafe fn entomb<W: Write>(&self, write: &mut AlignedWriter<W>) -> IOResult<()> {
+        <&T>::entomb(&self.as_ref(), write)
+    }
+
+    fn alignment() -> usize {
+        mem::align_of::<Self>().max(T::alignment())
+    }
+}
+unsafe impl<'de, T: Exhume<'de>> Exhume<'de> for Box<T> {
+    unsafe fn exhume(self_: NonNull<Self>, reader: &mut AlignedReader<'de>) -> Option<&'de mut Self> {
+        let target = exhume_ref(reader)?;
+        self_.as_ptr().write(Box::from_raw(target as *mut _));
+        Some(&mut *self_.as_ptr())
     }
 }
 
-// This method currently enables undefined behavior, by exposing padding bytes.
-#[inline] unsafe fn typed_to_bytes<T>(slice: &[T]) -> &[u8] {
-    std::slice::from_raw_parts(slice.as_ptr() as *const u8, slice.len() * mem::size_of::<T>())
+// Common subset of "exhume" for all [T]-like types
+// (I'd gladly move this to [T]::exhume, but building a NonNull<[T]> is currently too difficult)
+#[inline]
+unsafe fn exhume_slice<'de, T: Exhume<'de>>(
+    first_ptr: *mut T,
+    length: usize,
+    reader: &mut AlignedReader<'de>
+) -> Option<&'de mut [T]> {
+    for i in 0..length {
+        let element_ptr: NonNull<T> = NonNull::new_unchecked(first_ptr.add(i));
+        T::exhume(element_ptr, reader)?;
+    }
+    Some(std::slice::from_raw_parts_mut(first_ptr, length))
+}
+
+// Common subset of "exhume" for all &[T]-like types
+#[inline]
+unsafe fn exhume_slice_ref<'de, T: Exhume<'de>>(
+    length: usize,
+    reader: &mut AlignedReader<'de>
+) -> Option<&'de mut [T]> {
+    let first_ptr = reader.read_slice::<T>(length)?.as_ptr();
+    exhume_slice(first_ptr, length, reader)
+}
+
+// Common subset of "exhume" for all &mut T-like types
+unsafe fn exhume_ref<'de, T: Exhume<'de>>(reader: &mut AlignedReader<'de>) -> Option<&'de mut T> {
+    let target = reader.read::<T>()?;
+    T::exhume(target, reader)
+}
+
+// Common subset of "exhume" for all &str-like types
+unsafe fn exhume_str_ref<'de>(length: usize, reader: &mut AlignedReader<'de>) -> Option<&'de mut str> {
+    let bytes = exhume_slice_ref::<u8>(length, reader)?;
+    Some(std::str::from_utf8_unchecked_mut(bytes))
 }
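> Editor's note: for readers implementing the new trait pair by hand, the container impls above generalize directly. Below is a sketch for a hypothetical struct (`MyPair` is made up; the method signatures are the ones used throughout this patch, and it is presumably close to what `unsafe_abomonate!` would synthesize under the new API).

```rust
struct MyPair {
    id: u64,
    name: String,
}

unsafe impl Entomb for MyPair {
    unsafe fn entomb<W: Write>(&self, write: &mut AlignedWriter<W>) -> IOResult<()> {
        // Entomb each field's out-of-line data in declaration order.
        u64::entomb(&self.id, write)?;
        String::entomb(&self.name, write)
    }

    fn alignment() -> usize {
        mem::align_of::<Self>().max(u64::alignment()).max(String::alignment())
    }
}

unsafe impl<'de> Exhume<'de> for MyPair {
    unsafe fn exhume(self_: NonNull<Self>, reader: &mut AlignedReader<'de>) -> Option<&'de mut Self> {
        // Patch each field in the same order it was entombed.
        let id: NonNull<u64> = From::from(&mut (*self_.as_ptr()).id);
        u64::exhume(id, reader)?;
        let name: NonNull<String> = From::from(&mut (*self_.as_ptr()).name);
        String::exhume(name, reader)?;
        Some(&mut *self_.as_ptr())
    }
}
```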
 
 mod network {
-    use Abomonation;
+    use super::{Entomb, Exhume};
     use std::net::{SocketAddr, SocketAddrV4, SocketAddrV6, IpAddr, Ipv4Addr, Ipv6Addr};
 
-    impl Abomonation for IpAddr { }
-    impl Abomonation for Ipv4Addr { }
-    impl Abomonation for Ipv6Addr { }
-
-    impl Abomonation for SocketAddr { }
-    impl Abomonation for SocketAddrV4 { }
-    impl Abomonation for SocketAddrV6 { }
-}
\ No newline at end of file
+    unsafe impl Entomb for IpAddr { fn alignment() -> usize { std::mem::align_of::<Self>() } }
+    unsafe impl Exhume<'_> for IpAddr {}
+    unsafe impl Entomb for Ipv4Addr { fn alignment() -> usize { std::mem::align_of::<Self>() } }
+    unsafe impl Exhume<'_> for Ipv4Addr {}
+    unsafe impl Entomb for Ipv6Addr { fn alignment() -> usize { std::mem::align_of::<Self>() } }
+    unsafe impl Exhume<'_> for Ipv6Addr {}
+
+    unsafe impl Entomb for SocketAddr { fn alignment() -> usize { std::mem::align_of::<Self>() } }
+    unsafe impl Exhume<'_> for SocketAddr {}
+    unsafe impl Entomb for SocketAddrV4 { fn alignment() -> usize { std::mem::align_of::<Self>() } }
+    unsafe impl Exhume<'_> for SocketAddrV4 {}
+    unsafe impl Entomb for SocketAddrV6 { fn alignment() -> usize { std::mem::align_of::<Self>() } }
+    unsafe impl Exhume<'_> for SocketAddrV6 {}
+}
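> Editor's note: before the test changes, a quick sketch of what the lifetime-aware API buys: decoded values may now borrow from the byte buffer itself. Illustration only (`roundtrip_borrowed` is a made-up helper); the `encode`/`decode` signatures are the ones exercised by the tests below.

```rust
fn roundtrip_borrowed(bytes: &mut Vec<u8>) {
    unsafe { encode::<&str, _>(&"hello", bytes).unwrap(); }

    // The decoded &str points into `bytes`: no copy, no allocation.
    if let Some((decoded, rest)) = unsafe { decode::<&str>(&mut bytes[..]) } {
        assert_eq!(*decoded, "hello");
        assert!(rest.is_empty());
    }
}
```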
diff --git a/tests/tests.rs b/tests/tests.rs
index 340e776..0fec0e4 100644
--- a/tests/tests.rs
+++ b/tests/tests.rs
@@ -1,99 +1,129 @@
 extern crate abomonation;
 use abomonation::*;
+use abomonation::align::AlignedBytes;
+use std::fmt::Debug;
 
-#[test] fn test_array() { _test_pass(vec![[0, 1, 2]; 1024]); }
-#[test] fn test_nonzero() { _test_pass(vec![[std::num::NonZeroI32::new(1)]; 1024]); }
-#[test] fn test_opt_vec() { _test_pass(vec![Some(vec![0,1,2]), None]); }
-#[test] fn test_alignment() { _test_pass(vec![(format!("x"), vec![1,2,3]); 1024]); }
-#[test] fn test_alignment_128() { _test_pass(vec![(format!("x"), vec![1u128,2,3]); 1024]); }
-#[test] fn test_option_box_u64() { _test_pass(vec![Some(Box::new(0u64))]); }
-#[test] fn test_option_vec() { _test_pass(vec![Some(vec![0, 1, 2])]); }
-#[test] fn test_u32x4_pass() { _test_pass(vec![((1,2,3),vec![(0u32, 0u32, 0u32, 0u32); 1024])]); }
-#[test] fn test_u64_pass() { _test_pass(vec![0u64; 1024]); }
-#[test] fn test_u128_pass() { _test_pass(vec![0u128; 1024]); }
-#[test] fn test_string_pass() { _test_pass(vec![format!("grawwwwrr!"); 1024]); }
-#[test] fn test_vec_u_s_pass() { _test_pass(vec![vec![(0u64, format!("grawwwwrr!")); 32]; 32]); }
-
-#[test] fn test_u64_fail() { _test_fail(vec![0u64; 1024]); }
-#[test] fn test_u128_fail() { _test_fail(vec![0u128; 1024]); }
-#[test] fn test_string_fail() { _test_fail(vec![format!("grawwwwrr!"); 1024]); }
-#[test] fn test_vec_u_s_fail() { _test_fail(vec![vec![(0u64, format!("grawwwwrr!")); 32]; 32]); }
-
-#[test] fn test_array_size() { _test_size(vec![[0, 1, 2]; 1024]); }
-#[test] fn test_opt_vec_size() { _test_size(vec![Some(vec![0,1,2]), None]); }
-#[test] fn test_alignment_size() { _test_size(vec![(format!("x"), vec![1,2,3]); 1024]); }
-#[test] fn test_option_box_u64_size() { _test_size(vec![Some(Box::new(0u64))]); }
-#[test] fn test_option_vec_size() { _test_size(vec![Some(vec![0, 1, 2])]); }
-#[test] fn test_u32x4_size() { _test_size(vec![((1,2,3),vec![(0u32, 0u32, 0u32, 0u32); 1024])]); }
-#[test] fn test_u64_size() { _test_size(vec![0u64; 1024]); }
-#[test] fn test_u128_size() { _test_size(vec![0u128; 1024]); }
-#[test] fn test_string_size() { _test_size(vec![format!("grawwwwrr!"); 1024]); }
-#[test] fn test_vec_u_s_size() { _test_size(vec![vec![(0u64, format!("grawwwwrr!")); 32]; 32]); }
-
-#[test]
-fn test_phantom_data_for_non_abomonatable_type() {
-    use std::marker::PhantomData;
-    struct NotAbomonatable;
-    _test_pass(PhantomData::<NotAbomonatable>::default());
-}
-
-fn _test_pass<T: Abomonation+Eq>(record: T) {
-    let mut bytes = Vec::new();
-    unsafe { encode(&record, &mut bytes).unwrap(); }
-    {
-        let (result, rest) = unsafe { decode::<T>(&mut bytes[..]) }.unwrap();
-        assert!(&record == result);
-        assert!(rest.len() == 0);
-    }
-}
-
-fn _test_fail<T: Abomonation>(record: T) {
-    let mut bytes = Vec::new();
-    unsafe { encode(&record, &mut bytes).unwrap(); }
-    bytes.pop();
-    assert!(unsafe { decode::<T>(&mut bytes[..]) }.is_none());
-}
-
-fn _test_size<T: Abomonation>(record: T) {
-    let mut bytes = Vec::new();
-    unsafe { encode(&record, &mut bytes).unwrap(); }
-    assert_eq!(bytes.len(), measure(&record));
-}
-
-
-#[derive(Eq, PartialEq)]
+// Test struct for the unsafe_abomonate macro
+#[derive(Clone, Debug, Eq, PartialEq)]
 struct MyStruct {
     a: String,
     b: u64,
     c: Vec<u8>,
 }
-
 unsafe_abomonate!(MyStruct : a, b, c);
 
-#[test]
-fn test_macro() {
-    // create some test data out of abomonation-approved types
-    let record = MyStruct{ a: "test".to_owned(), b: 0, c: vec![0, 1, 2] };
+// Test for PhantomData abomonation, which has no Abomonation bound
+struct NotAbomonatable;
+type PhantomNotAbo = std::marker::PhantomData::<NotAbomonatable>;
+
+// Generic serialization/deserialization testing procedure, add your data here.
+macro_rules! gen_tests {
+    (
+        $( $data:expr => ($pass:ident, $fail:ident, $size:ident) ),*$(,)*
+    ) => {
+        $(
+            #[test] fn $pass() { _test_pass(&mut Vec::new(), vec![$data; 1024]); }
+            #[test] fn $fail() { _test_fail(&mut Vec::new(), vec![$data; 1024]); }
+            #[test] fn $size() { _test_size(&mut Vec::new(), vec![$data; 1024]); }
+        )*
+    };
+}
+gen_tests!{
+    [4, 1, 2] => (test_array_pass,
+                  test_array_fail,
+                  test_array_size),
+
+    std::num::NonZeroI32::new(1) => (test_nonzero_pass,
+                                     test_nonzero_fail,
+                                     test_nonzero_size),
+
+    Some(vec![8, 1, 2]) => (test_option_vec_pass,
+                            test_option_vec_fail,
+                            test_option_vec_size),
+
+    (format!("x"), vec![1, 2, 3]) => (test_alignment_pass,
+                                      test_alignment_fail,
+                                      test_alignment_size),
+
+    (format!("x"), vec![1u128, 2, 3]) => (test_alignment_128_pass,
+                                          test_alignment_128_fail,
+                                          test_alignment_128_size),
+
+    Some(Box::new(9u64)) => (test_option_box_u64_pass,
+                             test_option_box_u64_fail,
+                             test_option_box_u64_size),
+
+    (3u32, 8u32, 1u32, 7u32) => (test_u32x4_pass,
+                                 test_u32x4_fail,
+                                 test_u32x4_size),
+
+    42u64 => (test_u64_pass,
+              test_u64_fail,
+              test_u64_size),
+
+    687u128 => (test_u128_pass,
+                test_u128_fail,
+                test_u128_size),
+
+    format!("grawwwwrr!") => (test_string_pass,
+                              test_string_fail,
+                              test_string_size),
+
+    vec![(0u64, format!("grawwwwrr!")); 32] => (test_vec_u_s_pass,
+                                                test_vec_u_s_fail,
+                                                test_vec_u_s_size),
+
+    MyStruct{ a: "test".to_owned(),
+              b: 0,
+              c: vec![0, 1, 2] } => (test_macro_pass,
+                                     test_macro_fail,
+                                     test_macro_size),
+
+    PhantomNotAbo::default() => (test_phantom_notabo_pass,
+                                 test_phantom_notabo_fail,
+                                 test_phantom_notabo_size),
+
+    Some(&42u64) => (test_ref_u64_pass,
+                     test_ref_u64_fail,
+                     test_ref_u64_size),
+
+    &"grawwwwrr!" => (test_str_pass,
+                      test_str_fail,
+                      test_str_size),
+
+    &[0, 1, 2] => (test_slice_pass,
+                   test_slice_fail,
+                   test_slice_size),
+}
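> Editor's note: for reference, each `gen_tests!` entry expands mechanically into a pass/fail/size test trio; e.g. the `42u64` entry becomes:

```rust
#[test] fn test_u64_pass() { _test_pass(&mut Vec::new(), vec![42u64; 1024]); }
#[test] fn test_u64_fail() { _test_fail(&mut Vec::new(), vec![42u64; 1024]); }
#[test] fn test_u64_size() { _test_size(&mut Vec::new(), vec![42u64; 1024]); }
```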
 
-    // encode vector into a Vec<u8>
-    let mut bytes = Vec::new();
+// FIXME: I could not find an API which allows _test_pass to allocate a Vec
+//        internally without restricting the set of allowed Abomonation impls.
+fn _test_pass<'bytes, T>(mut bytes: &'bytes mut Vec<u8>, record: T)
+    where T: Abomonation<'bytes> + Debug + Eq
+{
     unsafe { encode(&record, &mut bytes).unwrap(); }
-
-    // decode a &Vec<(u64, String)> from binary data
-    if let Some((result, rest)) = unsafe { decode::<MyStruct>(&mut bytes) } {
-        assert!(result == &record);
-        assert!(rest.len() == 0);
+    {
+        let (result, rest) = unsafe { decode::<T>(&mut bytes[..]) }.unwrap();
+        assert_eq!(&record, result);
+        assert_eq!(rest.len(), 0);
     }
 }
 
-#[test]
-fn test_macro_size() {
-    // create some test data out of abomonation-approved types
-    let record = MyStruct{ a: "test".to_owned(), b: 0, c: vec![0, 1, 2] };
+// FIXME: I could not find an API which allows _test_fail to allocate a Vec
+//        internally without restricting the set of allowed Abomonation impls.
+fn _test_fail<'bytes, T>(mut bytes: &'bytes mut Vec<u8>, record: T)
+    where T: Abomonation<'bytes> + Debug + Eq
+{
+    unsafe { encode(&record, &mut bytes).unwrap(); }
+    if bytes.pop().is_some() {
+        assert_eq!(unsafe { decode::<T>(&mut bytes[..]) }, None);
+    }
+}
 
-    // encode vector into a Vec<u8>
-    let mut bytes = Vec::new();
+// FIXME: I could not find an API which allows _test_size to allocate a Vec
+//        internally without restricting the set of allowed Abomonation impls.
+fn _test_size<'bytes, T: Abomonation<'bytes>>(mut bytes: &'bytes mut Vec<u8>, record: T) {
     unsafe { encode(&record, &mut bytes).unwrap(); }
     assert_eq!(bytes.len(), measure(&record));
 }
@@ -106,10 +136,20 @@ fn test_multiple_encode_decode() {
     unsafe { encode(&vec![1,2,3], &mut bytes).unwrap(); }
     unsafe { encode(&"grawwwwrr".to_owned(), &mut bytes).unwrap(); }
 
-    let (t, r) = unsafe { decode::<u64>(&mut bytes) }.unwrap(); assert!(*t == 0);
-    let (t, r) = unsafe { decode::<u64>(r) }.unwrap(); assert!(*t == 7);
-    let (t, r) = unsafe { decode::<Vec<i32>>(r) }.unwrap(); assert!(*t == vec![1,2,3]);
-    let (t, _r) = unsafe { decode::<String>(r) }.unwrap(); assert!(*t == "grawwwwrr".to_owned());
+    let (t, r) = unsafe { decode::<u64>(&mut bytes) }.unwrap();
+    assert_eq!(*t, 0);
+
+    let mut r = AlignedBytes::<u64>::new(r);
+    let (t, r) = unsafe { decode::<u64>(&mut r) }.unwrap();
+    assert_eq!(*t, 7);
+
+    let mut r = AlignedBytes::<Vec<i32>>::new(r);
+    let (t, r) = unsafe { decode::<Vec<i32>>(&mut r) }.unwrap();
+    assert_eq!(*t, vec![1,2,3]);
+
+    let mut r = AlignedBytes::<String>::new(r);
+    let (t, _r) = unsafe { decode::<String>(&mut r) }.unwrap();
+    assert_eq!(*t, "grawwwwrr".to_owned());
 }
 
 #[test]
@@ -125,6 +165,36 @@ fn test_net_types() {
     unsafe { encode(&socket_addr4, &mut bytes).unwrap(); }
     unsafe { encode(&socket_addr6, &mut bytes).unwrap(); }
 
-    let (t, r) = unsafe { decode::<SocketAddrV4>(&mut bytes) }.unwrap(); assert!(*t == socket_addr4);
-    let (t, _r) = unsafe { decode::<SocketAddrV6>(r) }.unwrap(); assert!(*t == socket_addr6);
+    let (t, r) = unsafe { decode::<SocketAddrV4>(&mut bytes) }.unwrap(); assert_eq!(*t, socket_addr4);
+    let (t, _r) = unsafe { decode::<SocketAddrV6>(r) }.unwrap(); assert_eq!(*t, socket_addr6);
+}
+
+#[test]
+fn test_abomonated_owned() {
+    use abomonation::abomonated::Abomonated;
+
+    let s_owned = "This is an owned string".to_owned();
+
+    let mut bytes = Vec::new();
+    unsafe { encode::<String, _>(&s_owned, &mut bytes).unwrap(); }
+
+    let abo = unsafe { Abomonated::<String, _>::new(bytes).unwrap() };
+    assert_eq!(abo.as_ref(), &s_owned);
+    assert_eq!(&*abo, &s_owned);
+}
+
+#[test]
+fn test_abomonated_ref() {
+    use abomonation::abomonated::Abomonated;
+
+    let s_owned = "This is an owned string".to_owned();
+    let s_borrow = &s_owned[11..16]; // "owned"
+
+    let mut bytes = Vec::new();
+    unsafe { encode::<&str, _>(&s_borrow, &mut bytes).unwrap(); }
+
+    let abo = unsafe { Abomonated::<&str, _>::new(bytes).unwrap() };
+    assert_eq!(abo.as_ref(), &s_borrow);
+
+    // NOTE: Cannot use Deref here because &str contains a reference
+    // FIXME: Figure out a way to add a compile_fail test for this
+}
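> Editor's note: one plausible shape for the missing compile_fail test is a doctest that tries to dereference an `Abomonated` holding a borrowed payload. This is an untested sketch (`_deref_compile_fail_sketch` is a made-up name); it assumes that what must be ruled out is a `Deref` impl that would hand out a reference unbound from the backing storage.

```rust
/// Deref must stay unavailable for borrowed payloads such as `&str`,
/// since it could produce a reference outliving the backing bytes.
///
/// ```compile_fail
/// use abomonation::abomonated::Abomonated;
///
/// let mut bytes = Vec::new();
/// unsafe { abomonation::encode::<&str, _>(&"owned", &mut bytes).unwrap(); }
/// let abo = unsafe { Abomonated::<&str, _>::new(bytes).unwrap() };
/// let _: &&str = &*abo; // error: no Deref impl for Abomonated<&str, _>
/// ```
fn _deref_compile_fail_sketch() {}
```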